Loading...
Searching...
No Matches
divergence.hpp
Go to the documentation of this file.
1
2#pragma once
3
4#include "../../quadrature/quadrature.hpp"
6#include "dense/vec.hpp"
10#include "linalg/operator.hpp"
11#include "linalg/vector.hpp"
12#include "linalg/vector_q1.hpp"
13#include "util/timer.hpp"
15
17
28
29template < typename ScalarT >
31{
32 public:
35 using ScalarType = ScalarT;
36
37 private:
39 grid::shell::DistributedDomain domain_coarse_;
40
44
45 BoundaryConditions bcs_;
46
47 linalg::OperatorApplyMode operator_apply_mode_;
48 linalg::OperatorCommunicationMode operator_communication_mode_;
49
52
55
56 public:
58 const grid::shell::DistributedDomain& domain_fine,
59 const grid::shell::DistributedDomain& domain_coarse,
60 const grid::Grid3DDataVec< ScalarT, 3 >& grid_fine,
61 const grid::Grid2DDataScalar< ScalarT >& radii_fine,
63 BoundaryConditions bcs,
65 linalg::OperatorCommunicationMode operator_communication_mode =
67 : domain_fine_( domain_fine )
68 , domain_coarse_( domain_coarse )
69 , grid_fine_( grid_fine )
70 , radii_( radii_fine )
71 , boundary_mask_fine_( boundary_mask_fine )
72 , operator_apply_mode_( operator_apply_mode )
73 , operator_communication_mode_( operator_communication_mode )
74 // TODO: we can reuse the send and recv buffers and pass in from the outside somehow
75 , send_buffers_( domain_coarse )
76 , recv_buffers_( domain_coarse )
77 {
78 bcs_[0] = bcs[0];
79 bcs_[1] = bcs[1];
80 }
81
83 const linalg::OperatorApplyMode operator_apply_mode,
84 const linalg::OperatorCommunicationMode operator_communication_mode )
85 {
86 operator_apply_mode_ = operator_apply_mode;
87 operator_communication_mode_ = operator_communication_mode;
88 }
89
90 void apply_impl( const SrcVectorType& src, DstVectorType& dst )
91 {
92 util::Timer timer_apply( "divergence_apply" );
93
94 if ( operator_apply_mode_ == linalg::OperatorApplyMode::Replace )
95 {
96 assign( dst, 0 );
97 }
98
99 src_ = src.grid_data();
100 dst_ = dst.grid_data();
101
102 util::Timer timer_kernel( "divergence_kernel" );
103 Kokkos::parallel_for( "matvec", grid::shell::local_domain_md_range_policy_cells( domain_fine_ ), *this );
104 Kokkos::fence();
105 timer_kernel.stop();
106
107 if ( operator_communication_mode_ == linalg::OperatorCommunicationMode::CommunicateAdditively )
108 {
109 util::Timer timer_comm( "divergence_comm" );
110
112 domain_coarse_, dst_, send_buffers_, recv_buffers_ );
113 communication::shell::unpack_and_reduce_local_subdomain_boundaries( domain_coarse_, dst_, recv_buffers_ );
114 }
115 }
116
117 KOKKOS_INLINE_FUNCTION void
118 operator()( const int local_subdomain_id, const int x_cell, const int y_cell, const int r_cell ) const
119 {
120 // Gather surface points for each wedge.
122 wedge_surface_physical_coords( wedge_phy_surf, grid_fine_, local_subdomain_id, x_cell, y_cell );
123
124 // Gather wedge radii.
125 const ScalarT r_1 = radii_( local_subdomain_id, r_cell );
126 const ScalarT r_2 = radii_( local_subdomain_id, r_cell + 1 );
127
128 // Quadrature points.
129 constexpr auto num_quad_points = quadrature::quad_felippa_1x1_num_quad_points;
130
131 dense::Vec< ScalarT, 3 > quad_points[num_quad_points];
132 ScalarT quad_weights[num_quad_points];
133
136
137 const int fine_radial_wedge_index = r_cell % 2;
138
139 // Compute the local element matrix.
141
142 for ( int q = 0; q < num_quad_points; q++ )
143 {
144 for ( int wedge = 0; wedge < num_wedges_per_hex_cell; wedge++ )
145 {
146 const int fine_lateral_wedge_index = fine_lateral_wedge_idx( x_cell, y_cell, wedge );
147
148 const auto J = jac( wedge_phy_surf[wedge], r_1, r_2, quad_points[q] );
149 const auto det = Kokkos::abs( J.det() );
150 const auto J_inv_transposed = J.inv().transposed();
151
152 for ( int i = 0; i < num_nodes_per_wedge; i++ )
153 {
154 const auto shape_i =
155 shape_coarse( i, fine_radial_wedge_index, fine_lateral_wedge_index, quad_points[q] );
156
157 for ( int j = 0; j < num_nodes_per_wedge; j++ )
158 {
159 const auto grad_j = grad_shape( j, quad_points[q] );
160
161 for ( int d = 0; d < 3; d++ )
162 {
163 A[wedge]( i, d * 6 + j ) +=
164 quad_weights[q] * ( -( J_inv_transposed * grad_j )(d) *shape_i * det );
165 }
166 }
167 }
168 }
169 }
170
171 bool at_cmb = util::has_flag( boundary_mask_fine_( local_subdomain_id, x_cell, y_cell, r_cell ), CMB );
172 bool at_surface =
173 util::has_flag( boundary_mask_fine_( local_subdomain_id, x_cell, y_cell, r_cell + 1 ), SURFACE );
174
176 for ( int d = 0; d < 3; d++ )
177 {
179 extract_local_wedge_vector_coefficients( src_d, local_subdomain_id, x_cell, y_cell, r_cell, d, src_ );
180
181 for ( int wedge = 0; wedge < num_wedges_per_hex_cell; wedge++ )
182 {
183 for ( int i = 0; i < num_nodes_per_wedge; i++ )
184 {
185 src[wedge]( d * 6 + i ) = src_d[wedge]( i );
186 }
187 }
188 }
189
190 // Boundary treatment
191 dense::Mat< ScalarT, 6, 18 > boundary_mask;
192 boundary_mask.fill( 1.0 );
193
195
196 if ( at_cmb || at_surface )
197 {
198 // Inner boundary (CMB).
199 ShellBoundaryFlag sbf = at_cmb ? CMB : SURFACE;
200 BoundaryConditionFlag bcf = get_boundary_condition_flag( bcs_, sbf );
201
202 if ( bcf == DIRICHLET )
203 {
204 for ( int dimj = 0; dimj < 3; ++dimj )
205 {
206 for ( int i = 0; i < num_nodes_per_wedge; i++ )
207 {
208 for ( int j = 0; j < num_nodes_per_wedge; j++ )
209 {
210 if ( at_cmb && ( j < 3 ) || at_surface && ( j >= 3 ) )
211 {
212 boundary_mask( i, dimj * num_nodes_per_wedge + j ) = 0.0;
213 }
214 }
215 }
216 }
217 }
218 else if ( bcf == FREESLIP )
219 {
220
222
223 // reorder the source DoFs (and the local matrix columns) so they are grouped by node rather than by velocity dimension
224 for ( int wedge = 0; wedge < 2; ++wedge )
225 {
226 for ( int node_idxi = 0; node_idxi < num_nodes_per_wedge; node_idxi++ )
227 {
228 for ( int dimj = 0; dimj < 3; ++dimj )
229 {
230 for ( int node_idxj = 0; node_idxj < num_nodes_per_wedge; node_idxj++ )
231 {
232 A_tmp[wedge]( node_idxi, node_idxj * 3 + dimj ) =
233 A[wedge]( node_idxi, node_idxj + dimj * num_nodes_per_wedge );
234 }
235 }
236 }
238 }
239
240 // assemble rotation matrices for boundary nodes
241 // e.g. if we are at CMB, we need to rotate DoFs 0, 1, 2 of each wedge
242 // at SURFACE, we need to rotate DoFs 3, 4, 5
243
244 constexpr int layer_hex_offset_x[2][3] = { { 0, 1, 0 }, { 1, 0, 1 } };
245 constexpr int layer_hex_offset_y[2][3] = { { 0, 0, 1 }, { 1, 1, 0 } };
246
247 for ( int wedge = 0; wedge < 2; ++wedge )
248 {
249 // initialize the rotation matrix to the identity
250 for ( int i = 0; i < 18; ++i )
251 {
252 R[wedge]( i, i ) = 1.0;
253 }
254
255 for ( int boundary_node_idx = 0; boundary_node_idx < 3; boundary_node_idx++ )
256 {
257 // compute normal
259 local_subdomain_id,
260 x_cell + layer_hex_offset_x[wedge][boundary_node_idx],
261 y_cell + layer_hex_offset_y[wedge][boundary_node_idx],
262 r_cell + ( at_cmb ? 0 : 1 ),
263 grid_fine_,
264 radii_ );
265
266
267 // compute rotation matrix for DoFs on current node
268 auto R_i = trafo_mat_cartesian_to_normal_tangential( normal );
269
270 // insert into wedge-local rotation matrix
271 int offset_in_R = at_cmb ? 0 : 9;
272 for ( int dimi = 0; dimi < 3; ++dimi )
273 {
274 for ( int dimj = 0; dimj < 3; ++dimj )
275 {
276 R[wedge](
277 offset_in_R + boundary_node_idx * 3 + dimi,
278 offset_in_R + boundary_node_idx * 3 + dimj ) = R_i( dimi, dimj );
279 }
280 }
281 }
282
283 // transform the local matrix to the rotated (normal-tangential) space: pre-/post-multiply with the rotation matrices
284 // TODO transpose this way?
285 A[wedge] = A_tmp[wedge] * R[wedge].transposed();
286 // transform source dofs to nt-space
287 auto src_tmp = R[wedge] * src[wedge];
288 for ( int i = 0; i < 18; ++i )
289 {
290 src[wedge]( i ) = src_tmp( i );
291 }
292
293 // eliminate normal components: Dirichlet on the normal-tangential system
294 int node_start = at_surface ? 3 : 0;
295 int node_end = at_surface ? 6 : 3;
296 for ( int node_idx = node_start; node_idx < node_end; node_idx++ )
297 {
298 int idx = node_idx * 3;
299 for ( int k = 0; k < 6; ++k )
300 {
301 boundary_mask( k, idx ) = 0.0;
302 }
303 }
304 }
305 }
306 else if ( bcf == NEUMANN ) {}
307 }
308
309 // apply boundary mask
310 for ( int wedge = 0; wedge < num_wedges_per_hex_cell; wedge++ )
311 {
312 A[wedge].hadamard_product( boundary_mask );
313 }
314
316
317 dst[0] = A[0] * src[0];
318 dst[1] = A[1] * src[1];
319
320 // no need to reorder or post trafo the pressure:
321 // independent of dof ordering, div ops map to the same 6 coarse-grid pressure dofs in the same ordering
322
324 dst_, local_subdomain_id, x_cell / 2, y_cell / 2, r_cell / 2, dst );
325 }
326};
327
329
330} // namespace terra::fe::wedge::operators::shell
Divergence(const grid::shell::DistributedDomain &domain_fine, const grid::shell::DistributedDomain &domain_coarse, const grid::Grid3DDataVec< ScalarT, 3 > &grid_fine, const grid::Grid2DDataScalar< ScalarT > &radii_fine, const grid::Grid4DDataScalar< grid::shell::ShellBoundaryFlag > &boundary_mask_fine, BoundaryConditions bcs, linalg::OperatorApplyMode operator_apply_mode=linalg::OperatorApplyMode::Replace, linalg::OperatorCommunicationMode operator_communication_mode=linalg::OperatorCommunicationMode::CommunicateAdditively)
Definition divergence.hpp:57
void set_operator_apply_and_communication_modes(const linalg::OperatorApplyMode operator_apply_mode, const linalg::OperatorCommunicationMode operator_communication_mode)
Definition divergence.hpp:82
void apply_impl(const SrcVectorType &src, DstVectorType &dst)
Definition divergence.hpp:90
ScalarT ScalarType
Definition divergence.hpp:35
void operator()(const int local_subdomain_id, const int x_cell, const int y_cell, const int r_cell) const
Definition divergence.hpp:118
Parallel data structure organizing the thick spherical shell metadata for distributed (MPI parallel) ...
Definition spherical_shell.hpp:2498
Q1 scalar finite element vector on a distributed shell grid.
Definition vector_q1.hpp:21
const grid::Grid4DDataScalar< ScalarType > & grid_data() const
Get const reference to grid data.
Definition vector_q1.hpp:137
const grid::Grid4DDataVec< ScalarType, VecDim > & grid_data() const
Get const reference to grid data.
Definition vector_q1.hpp:280
Timer supporting RAII scope or manual stop.
Definition timer.hpp:270
void stop()
Stop the timer and record elapsed time.
Definition timer.hpp:289
Concept for types that behave like linear operators.
Definition operator.hpp:57
void unpack_and_reduce_local_subdomain_boundaries(const grid::shell::DistributedDomain &domain, const GridDataType &data, SubdomainNeighborhoodSendRecvBuffer< typename GridDataType::value_type, grid::grid_data_vec_dim< GridDataType >() > &boundary_recv_buffers, CommunicationReduction reduction=CommunicationReduction::SUM)
Unpacks and reduces local subdomain boundaries.
Definition communication.hpp:672
void pack_send_and_recv_local_subdomain_boundaries(const grid::shell::DistributedDomain &domain, const GridDataType &data, SubdomainNeighborhoodSendRecvBuffer< typename GridDataType::value_type, grid::grid_data_vec_dim< GridDataType >() > &boundary_send_buffers, SubdomainNeighborhoodSendRecvBuffer< typename GridDataType::value_type, grid::grid_data_vec_dim< GridDataType >() > &boundary_recv_buffers)
Packs, sends and recvs local subdomain boundaries using two sets of buffers.
Definition communication.hpp:242
Definition boundary_mass.hpp:14
constexpr void quad_felippa_1x1_quad_points(dense::Vec< T, 3 >(&quad_points)[quad_felippa_1x1_num_quad_points])
Definition wedge/quadrature/quadrature.hpp:36
constexpr void quad_felippa_1x1_quad_weights(T(&quad_weights)[quad_felippa_1x1_num_quad_points])
Definition wedge/quadrature/quadrature.hpp:43
constexpr int quad_felippa_1x1_num_quad_points
Definition wedge/quadrature/quadrature.hpp:32
constexpr int num_nodes_per_wedge_surface
Definition kernel_helpers.hpp:6
void atomically_add_local_wedge_scalar_coefficients(const grid::Grid4DDataScalar< T > &global_coefficients, const int local_subdomain_id, const int x_cell, const int y_cell, const int r_cell, const dense::Vec< T, 6 >(&local_coefficients)[2])
Performs an atomic add of the two local wedge coefficient vectors of a hex cell into the global coeff...
Definition kernel_helpers.hpp:407
constexpr int fine_lateral_wedge_idx(const int x_cell_fine, const int y_cell_fine, const int wedge_idx_fine)
Returns the lateral wedge index with respect to a coarse grid wedge from the fine wedge indices.
Definition kernel_helpers.hpp:601
void wedge_surface_physical_coords(dense::Vec< T, 3 >(&wedge_surf_phy_coords)[num_wedges_per_hex_cell][num_nodes_per_wedge_surface], const grid::Grid3DDataVec< T, 3 > &lateral_grid, const int local_subdomain_id, const int x_cell, const int y_cell)
Extracts the (unit sphere) surface vertex coords of the two wedges of a hex cell.
Definition kernel_helpers.hpp:26
constexpr void reorder_local_dofs(const DoFOrdering doo_from, const DoFOrdering doo_to, dense::Vec< ScalarT, 18 > &dofs)
Definition kernel_helpers.hpp:619
constexpr T shape_coarse(const int coarse_node_idx, const int fine_radial_wedge_idx, const int fine_lateral_wedge_idx, const T xi_fine, const T eta_fine, const T zeta_fine)
Definition integrands.hpp:373
constexpr int num_wedges_per_hex_cell
Definition kernel_helpers.hpp:5
void extract_local_wedge_vector_coefficients(dense::Vec< T, 6 >(&local_coefficients)[2], const int local_subdomain_id, const int x_cell, const int y_cell, const int r_cell, const int d, const grid::Grid4DDataVec< T, VecDim > &global_coefficients)
Extracts the local vector coefficients for the two wedges of a hex cell from the global coefficient v...
Definition kernel_helpers.hpp:356
constexpr int num_nodes_per_wedge
Definition kernel_helpers.hpp:7
constexpr dense::Vec< T, 3 > grad_shape(const int node_idx, const T xi, const T eta, const T zeta)
Gradient of the full shape function:
Definition integrands.hpp:228
constexpr dense::Mat< T, 3, 3 > jac(const dense::Vec< T, 3 > &p1_phy, const dense::Vec< T, 3 > &p2_phy, const dense::Vec< T, 3 > &p3_phy, const T r_1, const T r_2, const T xi, const T eta, const T zeta)
Definition integrands.hpp:643
dense::Vec< typename CoordsShellType::value_type, 3 > coords(const int subdomain, const int x, const int y, const int r, const CoordsShellType &coords_shell, const CoordsRadiiType &coords_radii)
Definition spherical_shell.hpp:2789
BoundaryConditionMapping[2] BoundaryConditions
Definition shell/bit_masks.hpp:37
ShellBoundaryFlag
FlagLike that indicates boundary types for the thick spherical shell.
Definition shell/bit_masks.hpp:12
Kokkos::MDRangePolicy< Kokkos::Rank< 4 > > local_domain_md_range_policy_cells(const DistributedDomain &distributed_domain)
Definition spherical_shell.hpp:2668
BoundaryConditionFlag get_boundary_condition_flag(const BoundaryConditions bcs, ShellBoundaryFlag sbf)
Retrieve the boundary condition flag that is associated with a location in the shell e....
Definition shell/bit_masks.hpp:42
BoundaryConditionFlag
FlagLike that indicates the type of boundary condition
Definition shell/bit_masks.hpp:25
Kokkos::View< ScalarType ***[VecDim], Layout > Grid3DDataVec
Definition grid_types.hpp:40
Kokkos::View< ScalarType ****[VecDim], Layout > Grid4DDataVec
Definition grid_types.hpp:43
Kokkos::View< ScalarType ****, Layout > Grid4DDataScalar
Definition grid_types.hpp:25
Kokkos::View< ScalarType **, Layout > Grid2DDataScalar
Definition grid_types.hpp:19
dense::Mat< ScalarType, 3, 3 > trafo_mat_cartesian_to_normal_tangential(const dense::Vec< ScalarType, 3 > &n_input)
Constructs a robust orthonormal transformation matrix from Cartesian to (normal–tangential–tangential...
Definition local_basis_trafo_normal_tangential.hpp:36
OperatorApplyMode
Modes for applying an operator to a vector.
Definition operator.hpp:30
@ Replace
Overwrite the destination vector.
OperatorCommunicationMode
Modes for communication during operator application.
Definition operator.hpp:40
@ CommunicateAdditively
Communicate and add results.
constexpr bool has_flag(E mask_value, E flag) noexcept
Checks if a bitmask value contains a specific flag.
Definition bit_masking.hpp:43
Definition mat.hpp:10
void fill(const T value)
Definition mat.hpp:201
constexpr Mat< T, Cols, Rows > transposed() const
Definition mat.hpp:187
Mat & hadamard_product(const Mat &mat)
Definition mat.hpp:213