feat3/burgers__assembler_8cpp_source.html

// FEAT3: Finite Element Analysis Toolbox, Version 3

// Copyright (C) 2010 by Stefan Turek & the FEAT group

// FEAT3 is released under the GNU General Public License version 3,

// see the file 'copyright.txt' in the top level directory for details.


#include <kernel/voxel_assembly/burgers_assembler.hpp>

#include <kernel/lafem/matrix_gather_scatter_helper.hpp>

#include <kernel/lafem/vector_gather_scatter_helper.hpp>

#include <kernel/util/math.hpp>

#include <kernel/lafem/vector_mirror.hpp>

#include <kernel/global/vector.hpp>


namespace FEAT

{

  namespace VoxelAssembly

  {

    namespace Kernel

    {


      // Host kernel that assembles the Burgers operator for all cells of one color and
      // scatters the local matrices into a blocked CSR matrix.
      //
      // matrix_data        raw matrix value array; reinterpreted as an array of dim x dim blocks
      // conv_data          raw convection vector; reinterpreted as an array of dim-vectors and only
      //                    gathered if convection or streamline diffusion is required
      // matrix_row_ptr,
      // matrix_col_idx     CSR layout arrays, forwarded to the matrix scatter helper
      // matrix_num_rows,
      // matrix_num_cols    matrix dimensions, forwarded to the scatter helper; the row count is also
      //                    passed as vector size to the convection gather
      // cub_pt, cub_wg,
      // num_cubs           cubature data, forwarded unchanged to the local assembly kernel
      // alpha              forwarded to the matrix scatter helper
      // cell_to_dof        dof indices, num_loc_dofs consecutive entries per cell
      // cell_num,
      // node_size          not used by this kernel
      // nodes              node array handed to SpaceHelp::set_coefficients
      // coloring_map       cell indices that are processed by this call
      // coloring_size      number of entries in coloring_map
      // cell_to_dof_sorter per-cell array (num_loc_dofs entries per cell) forwarded to the scatter helper
      // burgers_params     parameter set; beta, sd_delta and sd_v_norm are inspected here, the whole
      //                    structure is forwarded to the local assembly kernel
      //
      // NOTE(review): the scatter inside the parallel loop is not synchronised; this presumably relies
      // on cells of one color not sharing dofs -- confirm against the coloring code.
      template<typename Space_, typename DT_, typename IT_, FEAT::Intern::MatrixGatherScatterPolicy pol_ = FEAT::Intern::MatrixGatherScatterPolicy::useLocalOps>
      void full_burgers_assembler_matrix1_bcsr_host(DT_* matrix_data, const DT_* conv_data,
                const IT_*  matrix_row_ptr, const IT_* matrix_col_idx, Index matrix_num_rows, Index matrix_num_cols,
                const Tiny::Vector<DT_, Space_::world_dim>* cub_pt,
                const DT_*  cub_wg, int num_cubs, DT_ alpha,
                const IT_* cell_to_dof, [[maybe_unused]] Index cell_num,
                const Tiny::Vector<DT_, Space_::world_dim>* nodes, [[maybe_unused]] Index node_size,
                const int* coloring_map, Index coloring_size, const IT_* cell_to_dof_sorter,
                const VoxelAssembly::AssemblyBurgersData<DT_>& burgers_params)
      {
        // basic type aliases
        using SpaceType = Space_;
        using DataType = DT_;
        using IndexType = IT_;
        using SpaceHelp = VoxelAssembly::SpaceHelper<SpaceType, DT_, IT_>;

        // compile-time sizes of the local problem
        constexpr int dim = SpaceHelp::dim;
        constexpr int num_loc_dofs = SpaceType::DofMappingType::dof_count;
        constexpr int num_loc_verts = SpaceType::MeshType::template IndexSet<dim, 0>::Type::num_indices;

        // local value, vector and matrix types
        using VecValueType = Tiny::Vector<DataType, dim>;
        using MatValueType = Tiny::Matrix<DataType, dim, dim>;
        using LocalVectorType = Tiny::Vector<VecValueType, num_loc_dofs>;
        using LocalMatrixType = Tiny::Matrix<MatValueType, num_loc_dofs, num_loc_dofs>;
        using VectorHelper = LAFEM::VectorGatherScatterHelper<SpaceType, DataType, IndexType>;
        using MatrixHelper = LAFEM::MatrixGatherScatterHelper<SpaceType, DataType, IndexType, pol_>;

        // decide which terms have to be assembled at all
        const DataType& beta_val = burgers_params.beta;
        const DataType& sd_delta_val = burgers_params.sd_delta;
        const DataType& sd_v_norm_val = burgers_params.sd_v_norm;

        const DataType tol_eps = Math::sqrt(Math::eps<DataType>());
        const bool need_streamline = (Math::abs(sd_delta_val) > DataType(0)) && (sd_v_norm_val > tol_eps);
        const bool need_convection = Math::abs(beta_val) > DataType(0);
        // the convection dofs are required by either of the two terms
        const bool need_conv_dofs = need_convection || need_streamline;

        // blocked views on the raw scalar arrays
        const VecValueType* conv_blocks = reinterpret_cast<const VecValueType*>(conv_data);
        MatValueType* matrix_blocks = reinterpret_cast<MatValueType*>(matrix_data);
        const IndexType num_rows = IndexType(matrix_num_rows);
        const IndexType num_cols = IndexType(matrix_num_cols);

        FEAT_PRAGMA_OMP(parallel for)
        for(Index color_pos = 0; color_pos < coloring_size; ++color_pos)
        {
          // the cell handled in this iteration and its slices of the per-cell arrays
          IndexType cell = IndexType(coloring_map[color_pos]);
          const IndexType* cell_dofs = cell_to_dof + cell*num_loc_dofs;
          const IndexType* cell_dof_sorter = cell_to_dof_sorter + cell*num_loc_dofs;

          // fetch the coefficients of this cell
          Tiny::Matrix<DataType, dim, num_loc_verts> vertex_coeffs;
          const IndexSetWrapper<IndexType> dof_index_set{cell_to_dof, IndexType(num_loc_dofs)};
          SpaceHelp::set_coefficients(vertex_coeffs, dof_index_set, nodes, cell);

          // local convection values; stay zero unless they are actually needed
          LocalVectorType conv_dofs(DataType(0));
          if(need_conv_dofs)
          {
            VectorHelper::gather_vector_dense(conv_dofs, conv_blocks, num_rows, cell_dofs, DataType(1));
          }

          // assemble the local matrix
          // NOTE(review): cell_matrix is only default-constructed here; presumably the kernel formats
          // it before accumulating -- confirm.
          LocalMatrixType cell_matrix;
          VoxelAssembly::Kernel::burgers_mat_assembly_kernel<SpaceHelp>(cell_matrix, conv_dofs, vertex_coeffs,
                                      cub_pt, cub_wg, num_cubs, burgers_params,
                                      need_streamline, need_convection, tol_eps);

          // add the local matrix to the global one
          MatrixHelper::scatter_matrix_csr(cell_matrix, matrix_blocks, cell_dofs, cell_dofs,
                                      num_rows, num_cols, matrix_row_ptr, matrix_col_idx,
                                      alpha, cell_dof_sorter);
        }
      }


      // Host kernel that assembles the Burgers defect contribution for all cells of one color
      // and scatters the local vectors into a blocked dense vector.
      //
      // vector_data    raw target vector; reinterpreted as an array of dim-vectors
      // conv_data      raw convection vector; only gathered if the convection term is active
      // primal_data    raw primal vector; always gathered
      // vec_size       vector size that is passed to the gather/scatter helpers
      // cub_pt, cub_wg,
      // num_cubs       cubature data, forwarded unchanged to the local assembly kernel
      // alpha          forwarded to the vector scatter helper
      // cell_to_dof    dof indices, num_loc_dofs consecutive entries per cell
      // cell_num,
      // node_size      not used by this kernel
      // nodes          node array handed to SpaceHelp::set_coefficients
      // coloring_map   cell indices that are processed by this call
      // coloring_size  number of entries in coloring_map
      // burgers_params parameter set; beta is inspected here, the whole structure is forwarded
      //                to the local assembly kernel
      //
      // NOTE(review): the scatter inside the parallel loop is not synchronised; this presumably relies
      // on cells of one color not sharing dofs -- confirm against the coloring code.
      template<typename Space_, typename DT_, typename IT_>
      void full_burgers_assembler_vector_bd_host(DT_* vector_data,
                const DT_* conv_data, const DT_* primal_data, Index vec_size,
                const Tiny::Vector<DT_, Space_::world_dim>* cub_pt,
                const DT_*  cub_wg, int num_cubs, DT_ alpha,
                const IT_* cell_to_dof, [[maybe_unused]] Index cell_num,
                const Tiny::Vector<DT_, Space_::world_dim>* nodes, [[maybe_unused]] Index node_size,
                const int* coloring_map, Index coloring_size,
                const VoxelAssembly::AssemblyBurgersData<DT_>& burgers_params)
      {
        // basic type aliases
        using SpaceType = Space_;
        using DataType = DT_;
        using IndexType = IT_;
        using SpaceHelp = VoxelAssembly::SpaceHelper<SpaceType, DT_, IT_>;

        // compile-time sizes of the local problem
        constexpr int dim = SpaceHelp::dim;
        constexpr int num_loc_dofs = SpaceType::DofMappingType::dof_count;
        constexpr int num_loc_verts = SpaceType::MeshType::template IndexSet<dim, 0>::Type::num_indices;

        // local value and vector types
        using VecValueType = Tiny::Vector<DataType, dim>;
        using LocalVectorType = Tiny::Vector<VecValueType, num_loc_dofs>;
        using VectorHelper = LAFEM::VectorGatherScatterHelper<SpaceType, DataType, IndexType>;

        // the convection dofs are only required if the convection term is active
        const DataType& beta_val = burgers_params.beta;
        const bool need_convection = Math::abs(beta_val) > DataType(0);

        // blocked views on the raw scalar arrays
        const VecValueType* primal_blocks = reinterpret_cast<const VecValueType*>(primal_data);
        const VecValueType* conv_blocks = reinterpret_cast<const VecValueType*>(conv_data);
        VecValueType* defect_blocks = reinterpret_cast<VecValueType*>(vector_data);
        const IndexType num_blocks = IndexType(vec_size);

        FEAT_PRAGMA_OMP(parallel for)
        for(Index color_pos = 0; color_pos < coloring_size; ++color_pos)
        {
          // the cell handled in this iteration and its slice of the dof mapping
          IndexType cell = IndexType(coloring_map[color_pos]);
          const IndexType* cell_dofs = cell_to_dof + cell*num_loc_dofs;

          // fetch the coefficients of this cell
          Tiny::Matrix<DataType, dim, num_loc_verts> vertex_coeffs;
          const IndexSetWrapper<IndexType> dof_index_set{cell_to_dof, IndexType(num_loc_dofs)};
          SpaceHelp::set_coefficients(vertex_coeffs, dof_index_set, nodes, cell);

          // the primal values are always required
          LocalVectorType prim_dofs(DataType(0));
          VectorHelper::gather_vector_dense(prim_dofs, primal_blocks, num_blocks, cell_dofs, DataType(1));

          // local convection values; stay zero unless the convection term is active
          LocalVectorType conv_dofs(DataType(0));
          if(need_convection)
          {
            VectorHelper::gather_vector_dense(conv_dofs, conv_blocks, num_blocks, cell_dofs, DataType(1));
          }

          // assemble the local defect vector
          LocalVectorType cell_vector(DataType(0));
          VoxelAssembly::Kernel::burgers_defect_assembly_kernel<SpaceHelp>(cell_vector, prim_dofs, conv_dofs, vertex_coeffs,
                                                         cub_pt, cub_wg, num_cubs,
                                                         burgers_params, need_convection);

          // add the local vector to the global one
          VectorHelper::scatter_vector_dense(cell_vector, defect_blocks, num_blocks, cell_dofs, alpha);
        }
      }


      // Reduces the maximum Euclidean norm over all blocks of a convection vector.
      //
      // convect   array of vec_size blocks
      // result    output; overwritten with the largest value of norm_euclid() over all blocks,
      //           or with zero if vec_size is zero
      // vec_size  number of blocks in convect
      template<typename DT_, int dim_>
      void set_sd_v_norm_host(const Tiny::Vector<DT_, dim_>* convect, DT_* result, Index vec_size)
      {
        // norms are non-negative, so zero is the neutral element of the max-reduction
        DT_ max_val(DT_(0));

        // The counter has the same type as vec_size, as in the other parallel loops of this file;
        // a narrower int counter would truncate the bound for vectors with more than INT_MAX blocks.
        FEAT_PRAGMA_OMP(parallel for reduction(max : max_val))
        for(Index i = 0; i < vec_size; ++i)
        {
          max_val = Math::max(convect[i].norm_euclid(), max_val);
        }

        // hand the reduced value back to the caller
        *result = max_val;
      }


    }


    namespace Arch

    {

      template<typename Space_, typename DT_, typename IT_>

      void assemble_burgers_csr_host([[maybe_unused]]const Space_& space,

              const CSRMatrixData<DT_, IT_>& matrix_data,

              const DT_* conv_data,

              const AssemblyCubatureData<DT_>& cubature,

              const AssemblyMappingData<DT_, IT_>& dof_mapping,

              const std::vector<int*>& coloring_maps,

              const std::vector<Index>& coloring_map_sizes,

              DT_ alpha, const AssemblyBurgersData<DT_>& burgers_params)

      {

        for(Index col = 0; col < Index(coloring_maps.size()); ++col)

        {

          VoxelAssembly::Kernel::template full_burgers_assembler_matrix1_bcsr_host<Space_, DT_, IT_, FEAT::Intern::MatrixGatherScatterPolicy::useLocalSortHelper>(

              matrix_data.data, conv_data, matrix_data.row_ptr, matrix_data.col_idx, matrix_data.num_rows, matrix_data.num_cols,

              (const typename Tiny::Vector<DT_, Space_::world_dim>*) cubature.cub_pt,

              cubature.cub_wg, cubature.num_cubs, alpha,

              dof_mapping.cell_to_dof, dof_mapping.cell_num,

              (const typename Tiny::Vector<DT_, Space_::world_dim>*) dof_mapping.nodes, dof_mapping.node_size,

              (const int*) coloring_maps[col], coloring_map_sizes[col], dof_mapping.cell_to_dof_sorter,

              burgers_params

          );

        }


      }


      template<typename Space_, typename DT_, typename IT_>

      void assemble_burgers_defect_host([[maybe_unused]] const Space_& space,

              DT_* vector_data,

              const DT_* conv_data,

              const DT_* primal_data,

              const AssemblyCubatureData<DT_>& cubature,

              const AssemblyMappingData<DT_, IT_>& dof_mapping,

              const std::vector<int*>& coloring_maps,

              const std::vector<Index>& coloring_map_sizes,

              DT_ alpha, const AssemblyBurgersData<DT_>& burgers_params)

      {

        for(Index col = 0; col < Index(coloring_maps.size()); ++col)

        {

          VoxelAssembly::Kernel::template full_burgers_assembler_vector_bd_host<Space_, DT_, IT_>(vector_data, conv_data, primal_data,

              space.get_num_dofs(), (const typename Tiny::Vector<DT_, Space_::world_dim>*) cubature.cub_pt,

              cubature.cub_wg, cubature.num_cubs, alpha,

              dof_mapping.cell_to_dof, dof_mapping.cell_num,

              (const typename Tiny::Vector<DT_, Space_::world_dim>*) dof_mapping.nodes, dof_mapping.node_size,

              (const int*) coloring_maps[col], coloring_map_sizes[col], burgers_params

          );

        }

      }


      // Host kernel wrapper for the local sd_v_norm calculation.
      //
      // convect  blocked convection vector
      // returns  the value reduced by Kernel::set_sd_v_norm_host over the native elements of convect
      template<typename DT_, typename IT_, int dim_>
      DT_ get_sd_v_norm_host(const LAFEM::DenseVectorBlocked<DT_, IT_, dim_>& convect)
      {
        using BlockType = Tiny::Vector<DT_, dim_>;

        // native (blocked) view on the vector data and its length
        const BlockType* blocks = reinterpret_cast<const BlockType*>(convect.template elements<LAFEM::Perspective::native>());
        const Index num_blocks = convect.template size<LAFEM::Perspective::native>();

        // the kernel writes its result through a pointer
        DT_ max_norm = DT_(0);
        VoxelAssembly::Kernel::set_sd_v_norm_host<DT_, dim_>(blocks, &max_norm, num_blocks);

        return max_norm;
      }


      // sd_v_norm calculation for a global vector.
      //
      // Computes the value for the local part of the vector and, if the vector has a gate,
      // passes it through the gate's max() before returning it.
      //
      // convect  global blocked convection vector
      // returns  the local value if no gate is attached, otherwise the result of gate->max()
      template<typename DT_, typename IT_, int dim_>
      DT_ get_sd_v_norm_host(const Global::Vector<LAFEM::DenseVectorBlocked<DT_, IT_, dim_>, LAFEM::VectorMirror<DT_, IT_>>& convect)
      {
        const DT_ local_max = get_sd_v_norm_host(convect.local());

        const auto* gate = convect.get_gate();
        if(gate == nullptr)
        {
          // no gate attached: the local value is the final result
          return local_max;
        }

        return gate->max(local_max);
      }

    }

  }

}


// Explicit instantiation of the host templates defined above.
// The using-directives below allow the instantiations to name the FEAT and
// FEAT::VoxelAssembly types without qualification.

using namespace FEAT;

using namespace FEAT::VoxelAssembly;


/*******************************************************2D implementations***************************************************/

// Matrix assembly wrapper for Q2StandardQuad: double and float data, each with 32 bit and 64 bit indices.
template void Arch::assemble_burgers_csr_host(const Q2StandardQuad&, const CSRMatrixData<double, std::uint32_t>&, const double*, const AssemblyCubatureData<double>&, const AssemblyMappingData<double, std::uint32_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, double, const AssemblyBurgersData<double>&);

template void Arch::assemble_burgers_csr_host(const Q2StandardQuad&, const CSRMatrixData<float, std::uint32_t>&, const float*, const AssemblyCubatureData<float>&, const AssemblyMappingData<float, std::uint32_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, float, const AssemblyBurgersData<float>&);

template void Arch::assemble_burgers_csr_host(const Q2StandardQuad&, const CSRMatrixData<double, std::uint64_t>&, const double*, const AssemblyCubatureData<double>&, const AssemblyMappingData<double, std::uint64_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, double, const AssemblyBurgersData<double>&);

template void Arch::assemble_burgers_csr_host(const Q2StandardQuad&, const CSRMatrixData<float, std::uint64_t>&, const float*, const AssemblyCubatureData<float>&, const AssemblyMappingData<float, std::uint64_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, float, const AssemblyBurgersData<float>&);

// Half precision variants are only instantiated if FEAT_HAVE_HALFMATH is defined.
#ifdef FEAT_HAVE_HALFMATH

template void Arch::assemble_burgers_csr_host(const Q2StandardQuad&, const CSRMatrixData<Half, std::uint32_t>&, const Half*, const AssemblyCubatureData<Half>&, const AssemblyMappingData<Half, std::uint32_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, Half, const AssemblyBurgersData<Half>&);

template void Arch::assemble_burgers_csr_host(const Q2StandardQuad&, const CSRMatrixData<Half, std::uint64_t>&, const Half*, const AssemblyCubatureData<Half>&, const AssemblyMappingData<Half, std::uint64_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, Half, const AssemblyBurgersData<Half>&);

#endif


// Defect assembly wrapper for Q2StandardQuad: double and float data, each with 32 bit and 64 bit indices.
template void Arch::assemble_burgers_defect_host(const Q2StandardQuad&, double*, const double*, const double*, const AssemblyCubatureData<double>&, const AssemblyMappingData<double, std::uint32_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, double, const AssemblyBurgersData<double>&);

template void Arch::assemble_burgers_defect_host(const Q2StandardQuad&, float*, const float*, const float*, const AssemblyCubatureData<float>&, const AssemblyMappingData<float, std::uint32_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, float, const AssemblyBurgersData<float>&);

template void Arch::assemble_burgers_defect_host(const Q2StandardQuad&, double*, const double*, const double*, const AssemblyCubatureData<double>&, const AssemblyMappingData<double, std::uint64_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, double, const AssemblyBurgersData<double>&);

template void Arch::assemble_burgers_defect_host(const Q2StandardQuad&, float*, const float*, const float*, const AssemblyCubatureData<float>&, const AssemblyMappingData<float, std::uint64_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, float, const AssemblyBurgersData<float>&);

// Half precision variants are only instantiated if FEAT_HAVE_HALFMATH is defined.
#ifdef FEAT_HAVE_HALFMATH

template void Arch::assemble_burgers_defect_host(const Q2StandardQuad&, Half*, const Half*, const Half*, const AssemblyCubatureData<Half>&, const AssemblyMappingData<Half, std::uint32_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, Half, const AssemblyBurgersData<Half>&);

template void Arch::assemble_burgers_defect_host(const Q2StandardQuad&, Half*, const Half*, const Half*, const AssemblyCubatureData<Half>&, const AssemblyMappingData<Half, std::uint64_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, Half, const AssemblyBurgersData<Half>&);

#endif


// sd_v_norm calculation for local blocked vectors with block size 2.
template double Arch::get_sd_v_norm_host(const LAFEM::DenseVectorBlocked<double, std::uint32_t, 2>&);

template float Arch::get_sd_v_norm_host(const LAFEM::DenseVectorBlocked<float, std::uint32_t, 2>&);

template double Arch::get_sd_v_norm_host(const LAFEM::DenseVectorBlocked<double, std::uint64_t, 2>&);

template float Arch::get_sd_v_norm_host(const LAFEM::DenseVectorBlocked<float, std::uint64_t, 2>&);

// Half precision variants are only instantiated if FEAT_HAVE_HALFMATH is defined.
#ifdef FEAT_HAVE_HALFMATH

template Half Arch::get_sd_v_norm_host(const LAFEM::DenseVectorBlocked<Half, std::uint32_t, 2>&);

template Half Arch::get_sd_v_norm_host(const LAFEM::DenseVectorBlocked<Half, std::uint64_t, 2>&);

#endif


// sd_v_norm calculation for global blocked vectors with block size 2.
template double Arch::get_sd_v_norm_host(const Global::Vector<LAFEM::DenseVectorBlocked<double, std::uint32_t, 2>, LAFEM::VectorMirror<double, std::uint32_t>>&);

template float Arch::get_sd_v_norm_host(const Global::Vector<LAFEM::DenseVectorBlocked<float, std::uint32_t, 2>, LAFEM::VectorMirror<float, std::uint32_t>>&);

template double Arch::get_sd_v_norm_host(const Global::Vector<LAFEM::DenseVectorBlocked<double, std::uint64_t, 2>, LAFEM::VectorMirror<double, std::uint64_t>>&);

template float Arch::get_sd_v_norm_host(const Global::Vector<LAFEM::DenseVectorBlocked<float, std::uint64_t, 2>, LAFEM::VectorMirror<float, std::uint64_t>>&);

// Half precision variants are only instantiated if FEAT_HAVE_HALFMATH is defined.
#ifdef FEAT_HAVE_HALFMATH

template Half Arch::get_sd_v_norm_host(const Global::Vector<LAFEM::DenseVectorBlocked<Half, std::uint32_t, 2>, LAFEM::VectorMirror<Half, std::uint32_t>>&);

template Half Arch::get_sd_v_norm_host(const Global::Vector<LAFEM::DenseVectorBlocked<Half, std::uint64_t, 2>, LAFEM::VectorMirror<Half, std::uint64_t>>&);

#endif


/*********************************************************3D implementations**************************************************************************************/

// Matrix assembly wrapper for Q2StandardHexa: double and float data, each with 32 bit and 64 bit indices.
template void Arch::assemble_burgers_csr_host(const Q2StandardHexa&, const CSRMatrixData<double, std::uint32_t>&, const double*, const AssemblyCubatureData<double>&, const AssemblyMappingData<double, std::uint32_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, double, const AssemblyBurgersData<double>&);

template void Arch::assemble_burgers_csr_host(const Q2StandardHexa&, const CSRMatrixData<float, std::uint32_t>&, const float*, const AssemblyCubatureData<float>&, const AssemblyMappingData<float, std::uint32_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, float, const AssemblyBurgersData<float>&);

template void Arch::assemble_burgers_csr_host(const Q2StandardHexa&, const CSRMatrixData<double, std::uint64_t>&, const double*, const AssemblyCubatureData<double>&, const AssemblyMappingData<double, std::uint64_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, double, const AssemblyBurgersData<double>&);

template void Arch::assemble_burgers_csr_host(const Q2StandardHexa&, const CSRMatrixData<float, std::uint64_t>&, const float*, const AssemblyCubatureData<float>&, const AssemblyMappingData<float, std::uint64_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, float, const AssemblyBurgersData<float>&);

// Half precision variants are only instantiated if FEAT_HAVE_HALFMATH is defined.
#ifdef FEAT_HAVE_HALFMATH

template void Arch::assemble_burgers_csr_host(const Q2StandardHexa&, const CSRMatrixData<Half, std::uint32_t>&, const Half*, const AssemblyCubatureData<Half>&, const AssemblyMappingData<Half, std::uint32_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, Half, const AssemblyBurgersData<Half>&);

template void Arch::assemble_burgers_csr_host(const Q2StandardHexa&, const CSRMatrixData<Half, std::uint64_t>&, const Half*, const AssemblyCubatureData<Half>&, const AssemblyMappingData<Half, std::uint64_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, Half, const AssemblyBurgersData<Half>&);

#endif


// Defect assembly wrapper for Q2StandardHexa: double and float data, each with 32 bit and 64 bit indices.
template void Arch::assemble_burgers_defect_host(const Q2StandardHexa&, double*, const double*, const double*, const AssemblyCubatureData<double>&, const AssemblyMappingData<double, std::uint32_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, double, const AssemblyBurgersData<double>&);

template void Arch::assemble_burgers_defect_host(const Q2StandardHexa&, float*, const float*, const float*, const AssemblyCubatureData<float>&, const AssemblyMappingData<float, std::uint32_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, float, const AssemblyBurgersData<float>&);

template void Arch::assemble_burgers_defect_host(const Q2StandardHexa&, double*, const double*, const double*, const AssemblyCubatureData<double>&, const AssemblyMappingData<double, std::uint64_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, double, const AssemblyBurgersData<double>&);

template void Arch::assemble_burgers_defect_host(const Q2StandardHexa&, float*, const float*, const float*, const AssemblyCubatureData<float>&, const AssemblyMappingData<float, std::uint64_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, float, const AssemblyBurgersData<float>&);

// Half precision variants are only instantiated if FEAT_HAVE_HALFMATH is defined.
#ifdef FEAT_HAVE_HALFMATH

template void Arch::assemble_burgers_defect_host(const Q2StandardHexa&, Half*, const Half*, const Half*, const AssemblyCubatureData<Half>&, const AssemblyMappingData<Half, std::uint32_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, Half, const AssemblyBurgersData<Half>&);

template void Arch::assemble_burgers_defect_host(const Q2StandardHexa&, Half*, const Half*, const Half*, const AssemblyCubatureData<Half>&, const AssemblyMappingData<Half, std::uint64_t>&,

                                          const std::vector<int*>&, const std::vector<Index>&, Half, const AssemblyBurgersData<Half>&);

#endif


// sd_v_norm calculation for local blocked vectors with block size 3.
template double Arch::get_sd_v_norm_host(const LAFEM::DenseVectorBlocked<double, std::uint32_t, 3>&);

template float Arch::get_sd_v_norm_host(const LAFEM::DenseVectorBlocked<float, std::uint32_t, 3>&);

template double Arch::get_sd_v_norm_host(const LAFEM::DenseVectorBlocked<double, std::uint64_t, 3>&);

template float Arch::get_sd_v_norm_host(const LAFEM::DenseVectorBlocked<float, std::uint64_t, 3>&);

// Half precision variants are only instantiated if FEAT_HAVE_HALFMATH is defined.
#ifdef FEAT_HAVE_HALFMATH

template Half Arch::get_sd_v_norm_host(const LAFEM::DenseVectorBlocked<Half, std::uint32_t, 3>&);

template Half Arch::get_sd_v_norm_host(const LAFEM::DenseVectorBlocked<Half, std::uint64_t, 3>&);

#endif


// sd_v_norm calculation for global blocked vectors with block size 3.
template double Arch::get_sd_v_norm_host(const Global::Vector<LAFEM::DenseVectorBlocked<double, std::uint32_t, 3>, LAFEM::VectorMirror<double, std::uint32_t>>&);

template float Arch::get_sd_v_norm_host(const Global::Vector<LAFEM::DenseVectorBlocked<float, std::uint32_t, 3>, LAFEM::VectorMirror<float, std::uint32_t>>&);

template double Arch::get_sd_v_norm_host(const Global::Vector<LAFEM::DenseVectorBlocked<double, std::uint64_t, 3>, LAFEM::VectorMirror<double, std::uint64_t>>&);

template float Arch::get_sd_v_norm_host(const Global::Vector<LAFEM::DenseVectorBlocked<float, std::uint64_t, 3>, LAFEM::VectorMirror<float, std::uint64_t>>&);

// Half precision variants are only instantiated if FEAT_HAVE_HALFMATH is defined.
#ifdef FEAT_HAVE_HALFMATH

template Half Arch::get_sd_v_norm_host(const Global::Vector<LAFEM::DenseVectorBlocked<Half, std::uint32_t, 3>, LAFEM::VectorMirror<Half, std::uint32_t>>&);

template Half Arch::get_sd_v_norm_host(const Global::Vector<LAFEM::DenseVectorBlocked<Half, std::uint64_t, 3>, LAFEM::VectorMirror<Half, std::uint64_t>>&);

#endif

FEAT::Global::Vector
Global vector wrapper class template.
Definition: vector.hpp:68

FEAT::LAFEM::DenseVectorBlocked
Blocked Dense data vector class template.
Definition: dense_vector_blocked.hpp:81

FEAT::LAFEM::VectorMirror
Handles vector prolongation, restriction and serialization.
Definition: vector_mirror.hpp:52

FEAT::Space::Lagrange2::Element
Standard Lagrange-2 Finite-Element space class template.
Definition: element.hpp:39

FEAT::Tiny::Matrix
Tiny Matrix class template.
Definition: tiny_algebra.hpp:80

FEAT::Tiny::Vector
Tiny Vector class template.
Definition: tiny_algebra.hpp:52

FEAT::VoxelAssembly::IndexSetWrapper
Definition: space_helper.hpp:26

FEAT::Math::sqrt
T_ sqrt(T_ x)
Returns the square-root of a value.
Definition: math.hpp:300

FEAT::Math::abs
T_ abs(T_ x)
Returns the absolute value.
Definition: math.hpp:275

FEAT::Math::max
T_ max(T_ a, T_ b)
Returns the maximum of two values.
Definition: math.hpp:137

FEAT::VoxelAssembly::Arch::assemble_burgers_defect_host
void assemble_burgers_defect_host(const Space_ &space, DT_ *vector_data, const DT_ *conv_data, const DT_ *primal_data, const AssemblyCubatureData< DT_ > &cubature, const AssemblyMappingData< DT_, IT_ > &dof_mapping, const std::vector< int * > &coloring_maps, const std::vector< Index > &coloring_map_sizes, DT_ alpha, const AssemblyBurgersData< DT_ > &burgers_params)
Host kernel wrapper for the defect burgers assembler.
Definition: burgers_assembler.cpp:219

FEAT::VoxelAssembly::Arch::assemble_burgers_csr_host
void assemble_burgers_csr_host(const Space_ &space, const CSRMatrixData< DT_, IT_ > &matrix_data, const DT_ *conv_data, const AssemblyCubatureData< DT_ > &cubature, const AssemblyMappingData< DT_, IT_ > &dof_mapping, const std::vector< int * > &coloring_maps, const std::vector< Index > &coloring_map_sizes, DT_ alpha, const AssemblyBurgersData< DT_ > &burgers_params)
Host kernel wrapper for the full matrix burgers assembler.
Definition: burgers_assembler.cpp:194

FEAT::VoxelAssembly::Arch::get_sd_v_norm_host
DT_ get_sd_v_norm_host(const LAFEM::DenseVectorBlocked< DT_, IT_, dim_ > &convect)
Host kernel wrapper for the local sd_v_norm calculation.
Definition: burgers_assembler.cpp:242

FEAT::VoxelAssembly::Kernel::set_sd_v_norm_host
void set_sd_v_norm_host(const Tiny::Vector< DT_, dim_ > *convect, DT_ *result, Index vec_size)
Reduces the max local vector norm of a convection vector.
Definition: burgers_assembler.cpp:174

FEAT::VoxelAssembly
Namespace for different voxel based assembly methods.
Definition: burgers_assembler.cpp:16

FEAT
FEAT namespace.
Definition: adjactor.hpp:12

FEAT::Half
__half Half
Half data type.
Definition: half.hpp:25

FEAT::Index
std::uint64_t Index
Index data type.
Definition: base_header.hpp:122

FEAT::VoxelAssembly::AssemblyBurgersData
Data for burgers assembler.
Definition: voxel_assembly_common.hpp:111

FEAT::VoxelAssembly::AssemblyCubatureData
A data field for a cubature rule.
Definition: voxel_assembly_common.hpp:79

FEAT::VoxelAssembly::AssemblyCubatureData::cub_wg
const DT_ * cub_wg
The cubature weights.
Definition: voxel_assembly_common.hpp:83

FEAT::VoxelAssembly::AssemblyCubatureData::num_cubs
int num_cubs
Number of cubature points.
Definition: voxel_assembly_common.hpp:85

FEAT::VoxelAssembly::AssemblyCubatureData::cub_pt
const void * cub_pt
The cubature point data array.
Definition: voxel_assembly_common.hpp:81

FEAT::VoxelAssembly::AssemblyMappingData
A data field for all necessary values that define the dof mapping for assembly.
Definition: voxel_assembly_common.hpp:59

FEAT::VoxelAssembly::AssemblyMappingData::cell_num
Index cell_num
The number of cells.
Definition: voxel_assembly_common.hpp:65

FEAT::VoxelAssembly::AssemblyMappingData::cell_to_dof
const IT_ * cell_to_dof
The cell to dof, where cell_to_dof[i],..., cell_to_dof[i+cell_dofs-1] are the dofs of one cell.
Definition: voxel_assembly_common.hpp:61

FEAT::VoxelAssembly::AssemblyMappingData::node_size
Index node_size
The number of nodes.
Definition: voxel_assembly_common.hpp:69

FEAT::VoxelAssembly::AssemblyMappingData::cell_to_dof_sorter
const IT_ * cell_to_dof_sorter
Array of sorting indices of cell_to_dof.
Definition: voxel_assembly_common.hpp:63

FEAT::VoxelAssembly::AssemblyMappingData::nodes
const void * nodes
An array of the nodes fitting to the cell_to_dof mapping.
Definition: voxel_assembly_common.hpp:67

FEAT::VoxelAssembly::CSRMatrixData
CSR Matrix data.
Definition: voxel_assembly_common.hpp:96

FEAT::VoxelAssembly::SpaceHelper
Definition: space_helper.hpp:94