terraneo/laplace_8hpp_source.html

#pragma once


#include "../../quadrature/quadrature.hpp"

#include "communication/shell/communication.hpp"

#include "dense/vec.hpp"

#include "fe/wedge/integrands.hpp"

#include "fe/wedge/kernel_helpers.hpp"

#include "grid/shell/spherical_shell.hpp"

#include "linalg/operator.hpp"

#include "linalg/vector.hpp"

#include "linalg/vector_q1.hpp"

#include "util/timer.hpp"


namespace terra::fe::wedge::operators::shell {


/// @brief Matrix-free Laplace (stiffness) operator on the wedge elements of a spherical shell grid.
///
/// Every hex cell of the local domain is processed as `num_wedges_per_hex_cell` wedges. For each wedge
/// and each quadrature point the kernel accumulates
/// `quad_weight * grad_phy[i].dot( grad_u ) * |det J|` into the destination entries of the wedge nodes.
///
/// The object itself is the Kokkos functor that is launched in apply_impl(), i.e. it is copied
/// by value into the kernel.
///
/// @tparam ScalarT Scalar type of the vectors and of the grid data.
template < typename ScalarT >
class Laplace
{
  public:
    using SrcVectorType = linalg::VectorQ1Scalar< ScalarT >;
    using DstVectorType = linalg::VectorQ1Scalar< ScalarT >;
    using ScalarType    = ScalarT;

  private:
    grid::shell::DistributedDomain domain_;

    /// Lateral node coordinates; passed to wedge_surface_physical_coords().
    grid::Grid3DDataVec< ScalarT, 3 > grid_;
    /// Radii indexed by (local subdomain, radial node).
    grid::Grid2DDataScalar< ScalarT > radii_;
    /// Per-node boundary flags (CMB / SURFACE are queried by the kernel).
    grid::Grid4DDataScalar< grid::shell::ShellBoundaryFlag > mask_;

    /// If true, cells touching a flagged boundary get the Dirichlet treatment.
    bool treat_boundary_;
    /// If true, only the diagonal of the operator is applied.
    bool diagonal_;

    linalg::OperatorApplyMode         operator_apply_mode_;
    linalg::OperatorCommunicationMode operator_communication_mode_;

    communication::shell::SubdomainNeighborhoodSendRecvBuffer< ScalarT > send_buffers_;
    communication::shell::SubdomainNeighborhoodSendRecvBuffer< ScalarT > recv_buffers_;

    /// View handles of the vectors of the current apply_impl() call, read/written by operator().
    grid::Grid4DDataScalar< ScalarType > src_;
    grid::Grid4DDataScalar< ScalarType > dst_;

    /// @brief Maps a wedge-local node to its position in the 8-entry local hex arrays.
    ///
    /// The hex arrays are ordered as `4 * r + 2 * y + x` with offsets in {0, 1}. The tables are kept
    /// function-local so that there is a single copy of them for all kernel variants.
    ///
    /// @param wedge Wedge index within the hex cell (0 or 1).
    /// @param node  Node index within the wedge (0..5); nodes 0..2 have radial offset 0, nodes 3..5 radial offset 1.
    /// @return Index into `src_local_hex` / `dst_local_hex`.
    KOKKOS_INLINE_FUNCTION static int hex_node_index( const int wedge, const int node )
    {
        constexpr int offset_x[2][6] = { { 0, 1, 0, 0, 1, 0 }, { 1, 0, 1, 1, 0, 1 } };
        constexpr int offset_y[2][6] = { { 0, 0, 1, 0, 0, 1 }, { 1, 1, 0, 1, 1, 0 } };
        constexpr int offset_r[2][6] = { { 0, 0, 0, 1, 1, 1 }, { 0, 0, 0, 1, 1, 1 } };

        return 4 * offset_r[wedge][node] + 2 * offset_y[wedge][node] + offset_x[wedge][node];
    }

  public:
    /// @brief Sets up the operator; all arguments are stored as members.
    ///
    /// @param domain                      Distributed shell domain; also used to construct the send/recv buffers.
    /// @param grid                        Lateral node coordinates.
    /// @param radii                       Radii per local subdomain and radial node.
    /// @param mask                        Boundary flags per node.
    /// @param treat_boundary              Apply the Dirichlet treatment in cells touching the CMB or SURFACE flags.
    /// @param diagonal                    Apply only the diagonal of the operator.
    /// @param operator_apply_mode         In Replace mode the destination is set to zero before the kernel runs.
    /// @param operator_communication_mode In CommunicateAdditively mode subdomain boundaries are exchanged and
    ///                                    reduced after the kernel.
    Laplace(
        const grid::shell::DistributedDomain&                           domain,
        const grid::Grid3DDataVec< ScalarT, 3 >&                        grid,
        const grid::Grid2DDataScalar< ScalarT >&                        radii,
        const grid::Grid4DDataScalar< grid::shell::ShellBoundaryFlag >& mask,
        bool                                                            treat_boundary,
        bool                                                            diagonal,
        linalg::OperatorApplyMode         operator_apply_mode = linalg::OperatorApplyMode::Replace,
        linalg::OperatorCommunicationMode operator_communication_mode =
            linalg::OperatorCommunicationMode::CommunicateAdditively )
    : domain_( domain )
    , grid_( grid )
    , radii_( radii )
    , mask_( mask )
    , treat_boundary_( treat_boundary )
    , diagonal_( diagonal )
    , operator_apply_mode_( operator_apply_mode )
    , operator_communication_mode_( operator_communication_mode )
    // TODO: we can reuse the send and recv buffers and pass in from the outside somehow
    , send_buffers_( domain )
    , recv_buffers_( domain )
    {}

    /// @brief Applies the operator: accumulates the result for `src` into `dst`.
    ///
    /// Steps: validate extents, optionally zero `dst` (Replace mode), run the cell kernel, and
    /// optionally communicate/reduce the subdomain boundaries of `dst`.
    ///
    /// NOTE(review): in Replace mode `dst` is zeroed before `src` is read by the kernel, so `src` and
    /// `dst` presumably must not share data - confirm against callers.
    ///
    /// @param src Source vector.
    /// @param dst Destination vector.
    /// @throws std::runtime_error if the extents of `src` and `dst` differ, or if the lateral extents
    ///         of `src` do not match those of the grid. In that case `dst` is left untouched.
    void apply_impl( const SrcVectorType& src, DstVectorType& dst )
    {
        util::Timer timer_apply( "laplace_apply" );

        // Validate first, so that a rejected call neither zeroes dst nor changes the cached views.
        const auto& src_data = src.grid_data();
        const auto& dst_data = dst.grid_data();

        for ( int d = 0; d < 4; d++ )
        {
            if ( src_data.extent( d ) != dst_data.extent( d ) )
            {
                throw std::runtime_error( "Laplace: src/dst extent mismatch" );
            }
        }

        if ( src_data.extent( 1 ) != grid_.extent( 1 ) || src_data.extent( 2 ) != grid_.extent( 2 ) )
        {
            throw std::runtime_error( "Laplace: src/grid lateral extent mismatch" );
        }

        if ( operator_apply_mode_ == linalg::OperatorApplyMode::Replace )
        {
            assign( dst, 0 );
        }

        // The functor (a copy of *this) accesses the data through these members.
        src_ = src.grid_data();
        dst_ = dst.grid_data();

        util::Timer timer_kernel( "laplace_kernel" );
        Kokkos::parallel_for( "matvec", grid::shell::local_domain_md_range_policy_cells( domain_ ), *this );
        // Wait for the kernel so that the timer measures the kernel itself and dst is complete
        // before it is communicated.
        Kokkos::fence();
        timer_kernel.stop();

        if ( operator_communication_mode_ == linalg::OperatorCommunicationMode::CommunicateAdditively )
        {
            util::Timer timer_comm( "laplace_comm" );
            communication::shell::pack_send_and_recv_local_subdomain_boundaries(
                domain_, dst_, send_buffers_, recv_buffers_ );
            communication::shell::unpack_and_reduce_local_subdomain_boundaries( domain_, dst_, recv_buffers_ );
        }
    }

    /// @brief Kernel body for one hex cell: computes the local contributions of both wedges and
    ///        adds them atomically to the destination.
    ///
    /// @param local_subdomain_id Index of the local subdomain.
    /// @param x_cell             Cell index in the first lateral direction.
    /// @param y_cell             Cell index in the second lateral direction.
    /// @param r_cell             Cell index in radial direction.
    KOKKOS_INLINE_FUNCTION void
        operator()( const int local_subdomain_id, const int x_cell, const int y_cell, const int r_cell ) const
    {
        // Node offsets of the 8 hex corners, ordered as 4 * r + 2 * y + x.
        constexpr int hex_offset_x[8] = { 0, 1, 0, 1, 0, 1, 0, 1 };
        constexpr int hex_offset_y[8] = { 0, 0, 1, 1, 0, 0, 1, 1 };
        constexpr int hex_offset_r[8] = { 0, 0, 0, 0, 1, 1, 1, 1 };

        // Gather surface points for each wedge.
        dense::Vec< ScalarT, 3 > wedge_phy_surf[num_wedges_per_hex_cell][num_nodes_per_wedge_surface] = {};
        wedge_surface_physical_coords( wedge_phy_surf, grid_, local_subdomain_id, x_cell, y_cell );

        // Gather wedge radii.
        const ScalarT r_1 = radii_( local_subdomain_id, r_cell );
        const ScalarT r_2 = radii_( local_subdomain_id, r_cell + 1 );

        // Quadrature points.
        constexpr auto num_quad_points = quadrature::quad_felippa_3x2_num_quad_points;

        dense::Vec< ScalarT, 3 > quad_points[num_quad_points];
        ScalarT                  quad_weights[num_quad_points];

        quadrature::quad_felippa_3x2_quad_points( quad_points );
        quadrature::quad_felippa_3x2_quad_weights( quad_weights );

        // Gather the source values of the hex cell; the result is accumulated locally first.
        ScalarType src_local_hex[8] = { 0 };
        ScalarType dst_local_hex[8] = { 0 };

        for ( int i = 0; i < 8; i++ )
        {
            src_local_hex[i] = src_(
                local_subdomain_id, x_cell + hex_offset_x[i], y_cell + hex_offset_y[i], r_cell + hex_offset_r[i] );
        }

        const bool at_bot_boundary =
            util::has_flag( mask_( local_subdomain_id, x_cell, y_cell, r_cell ), grid::shell::ShellBoundaryFlag::CMB );
        const bool at_top_boundary = util::has_flag(
            mask_( local_subdomain_id, x_cell, y_cell, r_cell + 1 ), grid::shell::ShellBoundaryFlag::SURFACE );

        // The kernel variant does not depend on the wedge or quadrature point - select it once.
        const bool dirichlet_at_bot = treat_boundary_ && at_bot_boundary;
        const bool dirichlet_at_top = treat_boundary_ && at_top_boundary;

        // If the cell touches both boundaries, all six wedge nodes are Dirichlet nodes: combining the
        // bottom and the top treatment leaves only the diagonal entries.
        const bool diagonal_only = diagonal_ || ( dirichlet_at_bot && dirichlet_at_top );

        for ( int wedge = 0; wedge < num_wedges_per_hex_cell; wedge++ )
        {
            for ( int q = 0; q < num_quad_points; q++ )
            {
                const auto& quad_point  = quad_points[q];
                const auto  quad_weight = quad_weights[q];

                // 1. Compute Jacobian and inverse at this quadrature point.
                const auto J                = jac( wedge_phy_surf[wedge], r_1, r_2, quad_point );
                const auto det              = J.det();
                const auto abs_det          = Kokkos::abs( det );
                const auto J_inv_transposed = J.inv_transposed( det );

                // 2. Compute physical gradients for all nodes at this quadrature point.
                dense::Vec< ScalarType, 3 > grad_phy[num_nodes_per_wedge];
                for ( int k = 0; k < num_nodes_per_wedge; k++ )
                {
                    grad_phy[k] = J_inv_transposed * grad_shape( k, quad_point );
                }

                // 3. + 4. Accumulate the contributions of this quadrature point.
                if ( diagonal_only )
                {
                    diagonal( src_local_hex, dst_local_hex, wedge, quad_weight, abs_det, grad_phy );
                }
                else if ( dirichlet_at_bot )
                {
                    // Bottom boundary dirichlet
                    dirichlet_bot( src_local_hex, dst_local_hex, wedge, quad_weight, abs_det, grad_phy );
                }
                else if ( dirichlet_at_top )
                {
                    // Top boundary dirichlet
                    dirichlet_top( src_local_hex, dst_local_hex, wedge, quad_weight, abs_det, grad_phy );
                }
                else
                {
                    neumann( src_local_hex, dst_local_hex, wedge, quad_weight, abs_det, grad_phy );
                }
            }
        }

        // Neighboring cells share nodes, so the scatter into dst has to be atomic.
        for ( int i = 0; i < 8; i++ )
        {
            Kokkos::atomic_add(
                &dst_(
                    local_subdomain_id, x_cell + hex_offset_x[i], y_cell + hex_offset_y[i], r_cell + hex_offset_r[i] ),
                dst_local_hex[i] );
        }
    }

    /// @brief Full (unconstrained) contribution of one wedge at one quadrature point.
    ///
    /// @param src_local_hex Source values at the 8 hex nodes (only read).
    /// @param dst_local_hex Local result at the 8 hex nodes (accumulated into).
    /// @param wedge         Wedge index within the hex cell.
    /// @param quad_weight   Weight of the quadrature point.
    /// @param abs_det       Absolute value of the Jacobian determinant at the quadrature point.
    /// @param grad_phy      Physical shape function gradients of the wedge nodes at the quadrature point.
    KOKKOS_INLINE_FUNCTION void neumann(
        ScalarType*                        src_local_hex,
        ScalarType*                        dst_local_hex,
        const int                          wedge,
        const ScalarType                   quad_weight,
        const ScalarType                   abs_det,
        const dense::Vec< ScalarType, 3 >* grad_phy ) const
    {
        // 3. Compute ∇u at this quadrature point.
        dense::Vec< ScalarType, 3 > grad_u;
        grad_u.fill( 0.0 );
        for ( int j = 0; j < num_nodes_per_wedge; j++ )
        {
            grad_u = grad_u + src_local_hex[hex_node_index( wedge, j )] * grad_phy[j];
        }

        // 4. Add the test function contributions.
        for ( int i = 0; i < num_nodes_per_wedge; i++ )
        {
            dst_local_hex[hex_node_index( wedge, i )] += quad_weight * grad_phy[i].dot( grad_u ) * abs_det;
        }
    }

    /// @brief Contribution of one wedge whose bottom face (nodes 0..2) lies on the Dirichlet boundary.
    ///
    /// The top-face nodes 3..5 are coupled only among themselves; the bottom-face nodes 0..2
    /// only receive their diagonal entry.
    ///
    /// @param src_local_hex Source values at the 8 hex nodes (only read).
    /// @param dst_local_hex Local result at the 8 hex nodes (accumulated into).
    /// @param wedge         Wedge index within the hex cell.
    /// @param quad_weight   Weight of the quadrature point.
    /// @param abs_det       Absolute value of the Jacobian determinant at the quadrature point.
    /// @param grad_phy      Physical shape function gradients of the wedge nodes at the quadrature point.
    KOKKOS_INLINE_FUNCTION void dirichlet_bot(
        ScalarType*                        src_local_hex,
        ScalarType*                        dst_local_hex,
        const int                          wedge,
        const ScalarType                   quad_weight,
        const ScalarType                   abs_det,
        const dense::Vec< ScalarType, 3 >* grad_phy ) const
    {
        // 3. Compute ∇u at this quadrature point (top-face nodes only).
        dense::Vec< ScalarType, 3 > grad_u;
        grad_u.fill( 0.0 );
        for ( int j = 3; j < num_nodes_per_wedge; j++ )
        {
            grad_u = grad_u + src_local_hex[hex_node_index( wedge, j )] * grad_phy[j];
        }

        // 4. Add the test function contributions (top-face nodes only).
        for ( int i = 3; i < num_nodes_per_wedge; i++ )
        {
            dst_local_hex[hex_node_index( wedge, i )] += quad_weight * grad_phy[i].dot( grad_u ) * abs_det;
        }

        // Diagonal for bottom part
        for ( int i = 0; i < 3; i++ )
        {
            const int  hex_node    = hex_node_index( wedge, i );
            const auto grad_u_diag = src_local_hex[hex_node] * grad_phy[i];

            dst_local_hex[hex_node] += quad_weight * grad_phy[i].dot( grad_u_diag ) * abs_det;
        }
    }

    /// @brief Contribution of one wedge whose top face (nodes 3..5) lies on the Dirichlet boundary.
    ///
    /// The bottom-face nodes 0..2 are coupled only among themselves; the top-face nodes 3..5
    /// only receive their diagonal entry.
    ///
    /// @param src_local_hex Source values at the 8 hex nodes (only read).
    /// @param dst_local_hex Local result at the 8 hex nodes (accumulated into).
    /// @param wedge         Wedge index within the hex cell.
    /// @param quad_weight   Weight of the quadrature point.
    /// @param abs_det       Absolute value of the Jacobian determinant at the quadrature point.
    /// @param grad_phy      Physical shape function gradients of the wedge nodes at the quadrature point.
    KOKKOS_INLINE_FUNCTION void dirichlet_top(
        ScalarType*                        src_local_hex,
        ScalarType*                        dst_local_hex,
        const int                          wedge,
        const ScalarType                   quad_weight,
        const ScalarType                   abs_det,
        const dense::Vec< ScalarType, 3 >* grad_phy ) const
    {
        // 3. Compute ∇u at this quadrature point (bottom-face nodes only).
        dense::Vec< ScalarType, 3 > grad_u;
        grad_u.fill( 0.0 );
        for ( int j = 0; j < 3; j++ )
        {
            grad_u = grad_u + src_local_hex[hex_node_index( wedge, j )] * grad_phy[j];
        }

        // 4. Add the test function contributions (bottom-face nodes only).
        for ( int i = 0; i < 3; i++ )
        {
            dst_local_hex[hex_node_index( wedge, i )] += quad_weight * grad_phy[i].dot( grad_u ) * abs_det;
        }

        // Diagonal for top part
        for ( int i = 3; i < num_nodes_per_wedge; i++ )
        {
            const int  hex_node    = hex_node_index( wedge, i );
            const auto grad_u_diag = src_local_hex[hex_node] * grad_phy[i];

            dst_local_hex[hex_node] += quad_weight * grad_phy[i].dot( grad_u_diag ) * abs_det;
        }
    }

    /// @brief Diagonal-only contribution of one wedge at one quadrature point.
    ///
    /// Every node is coupled only with itself.
    ///
    /// @param src_local_hex Source values at the 8 hex nodes (only read).
    /// @param dst_local_hex Local result at the 8 hex nodes (accumulated into).
    /// @param wedge         Wedge index within the hex cell.
    /// @param quad_weight   Weight of the quadrature point.
    /// @param abs_det       Absolute value of the Jacobian determinant at the quadrature point.
    /// @param grad_phy      Physical shape function gradients of the wedge nodes at the quadrature point.
    KOKKOS_INLINE_FUNCTION void diagonal(
        ScalarType*                        src_local_hex,
        ScalarType*                        dst_local_hex,
        const int                          wedge,
        const ScalarType                   quad_weight,
        const ScalarType                   abs_det,
        const dense::Vec< ScalarType, 3 >* grad_phy ) const
    {
        // 3. + 4. Per node: gradient of its own contribution, tested with its own shape function.
        for ( int i = 0; i < num_nodes_per_wedge; i++ )
        {
            const int  hex_node = hex_node_index( wedge, i );
            const auto grad_u   = src_local_hex[hex_node] * grad_phy[i];

            dst_local_hex[hex_node] += quad_weight * grad_phy[i].dot( grad_u ) * abs_det;
        }
    }
};


// Compile-time check that Laplace satisfies the linalg::OperatorLike concept for float and double.
static_assert( linalg::OperatorLike< Laplace< float > > );

static_assert( linalg::OperatorLike< Laplace< double > > );


} // namespace terra::fe::wedge::operators::shell

terra::communication::shell::SubdomainNeighborhoodSendRecvBuffer< ScalarT >

terra::fe::wedge::operators::shell::Laplace
Definition laplace.hpp:19

terra::fe::wedge::operators::shell::Laplace::neumann
void neumann(ScalarType *src_local_hex, ScalarType *dst_local_hex, const int wedge, const ScalarType quad_weight, const ScalarType abs_det, const dense::Vec< ScalarType, 3 > *grad_phy) const
Definition laplace.hpp:200

terra::fe::wedge::operators::shell::Laplace::dirichlet_bot
void dirichlet_bot(ScalarType *src_local_hex, ScalarType *dst_local_hex, const int wedge, const ScalarType quad_weight, const ScalarType abs_det, const dense::Vec< ScalarType, 3 > *grad_phy) const
Definition laplace.hpp:229

terra::fe::wedge::operators::shell::Laplace::ScalarType
ScalarT ScalarType
Definition laplace.hpp:23

terra::fe::wedge::operators::shell::Laplace::diagonal
void diagonal(ScalarType *src_local_hex, ScalarType *dst_local_hex, const int wedge, const ScalarType quad_weight, const ScalarType abs_det, const dense::Vec< ScalarType, 3 > *grad_phy) const
Definition laplace.hpp:307

terra::fe::wedge::operators::shell::Laplace::apply_impl
void apply_impl(const SrcVectorType &src, DstVectorType &dst)
Definition laplace.hpp:68

terra::fe::wedge::operators::shell::Laplace::operator()
void operator()(const int local_subdomain_id, const int x_cell, const int y_cell, const int r_cell) const
Definition laplace.hpp:106

terra::fe::wedge::operators::shell::Laplace::Laplace
Laplace(const grid::shell::DistributedDomain &domain, const grid::Grid3DDataVec< ScalarT, 3 > &grid, const grid::Grid2DDataScalar< ScalarT > &radii, const grid::Grid4DDataScalar< grid::shell::ShellBoundaryFlag > &mask, bool treat_boundary, bool diagonal, linalg::OperatorApplyMode operator_apply_mode=linalg::OperatorApplyMode::Replace, linalg::OperatorCommunicationMode operator_communication_mode=linalg::OperatorCommunicationMode::CommunicateAdditively)
Definition laplace.hpp:45

terra::fe::wedge::operators::shell::Laplace::dirichlet_top
void dirichlet_top(ScalarType *src_local_hex, ScalarType *dst_local_hex, const int wedge, const ScalarType quad_weight, const ScalarType abs_det, const dense::Vec< ScalarType, 3 > *grad_phy) const
Definition laplace.hpp:268

terra::grid::shell::DistributedDomain
Parallel data structure organizing the thick spherical shell metadata for distributed (MPI parallel) ...
Definition spherical_shell.hpp:2518

terra::linalg::VectorQ1Scalar
Q1 scalar finite element vector on a distributed shell grid.
Definition vector_q1.hpp:21

terra::linalg::VectorQ1Scalar::grid_data
const grid::Grid4DDataScalar< ScalarType > & grid_data() const
Get const reference to grid data.
Definition vector_q1.hpp:139

terra::util::Timer
Timer supporting RAII scope or manual stop.
Definition timer.hpp:342

terra::util::Timer::stop
void stop()
Stop the timer and record elapsed time.
Definition timer.hpp:364

communication.hpp

terra::linalg::OperatorLike
Concept for types that behave like linear operators.
Definition operator.hpp:57

integrands.hpp

kernel_helpers.hpp

terra::communication::shell::unpack_and_reduce_local_subdomain_boundaries
void unpack_and_reduce_local_subdomain_boundaries(const grid::shell::DistributedDomain &domain, const GridDataType &data, SubdomainNeighborhoodSendRecvBuffer< typename GridDataType::value_type, grid::grid_data_vec_dim< GridDataType >() > &boundary_recv_buffers, CommunicationReduction reduction=CommunicationReduction::SUM)
Unpacks and reduces local subdomain boundaries.
Definition communication.hpp:672

terra::communication::shell::pack_send_and_recv_local_subdomain_boundaries
void pack_send_and_recv_local_subdomain_boundaries(const grid::shell::DistributedDomain &domain, const GridDataType &data, SubdomainNeighborhoodSendRecvBuffer< typename GridDataType::value_type, grid::grid_data_vec_dim< GridDataType >() > &boundary_send_buffers, SubdomainNeighborhoodSendRecvBuffer< typename GridDataType::value_type, grid::grid_data_vec_dim< GridDataType >() > &boundary_recv_buffers)
Packs, sends and recvs local subdomain boundaries using two sets of buffers.
Definition communication.hpp:242

terra::fe::wedge::operators::shell
Definition boundary_mass.hpp:14

terra::fe::wedge::quadrature::quad_felippa_3x2_quad_weights
constexpr void quad_felippa_3x2_quad_weights(T(&quad_weights)[quad_felippa_3x2_num_quad_points])
Definition wedge/quadrature/quadrature.hpp:93

terra::fe::wedge::quadrature::quad_felippa_3x2_num_quad_points
constexpr int quad_felippa_3x2_num_quad_points
Definition wedge/quadrature/quadrature.hpp:66

terra::fe::wedge::quadrature::quad_felippa_3x2_quad_points
constexpr void quad_felippa_3x2_quad_points(dense::Vec< T, 3 >(&quad_points)[quad_felippa_3x2_num_quad_points])
Definition wedge/quadrature/quadrature.hpp:70

terra::fe::wedge::num_nodes_per_wedge_surface
constexpr int num_nodes_per_wedge_surface
Definition kernel_helpers.hpp:6

terra::fe::wedge::wedge_surface_physical_coords
void wedge_surface_physical_coords(dense::Vec< T, 3 >(&wedge_surf_phy_coords)[num_wedges_per_hex_cell][num_nodes_per_wedge_surface], const grid::Grid3DDataVec< T, 3 > &lateral_grid, const int local_subdomain_id, const int x_cell, const int y_cell)
Extracts the (unit sphere) surface vertex coords of the two wedges of a hex cell.
Definition kernel_helpers.hpp:26

terra::fe::wedge::num_wedges_per_hex_cell
constexpr int num_wedges_per_hex_cell
Definition kernel_helpers.hpp:5

terra::fe::wedge::num_nodes_per_wedge
constexpr int num_nodes_per_wedge
Definition kernel_helpers.hpp:7

terra::fe::wedge::grad_shape
constexpr dense::Vec< T, 3 > grad_shape(const int node_idx, const T xi, const T eta, const T zeta)
Gradient of the full shape function:
Definition integrands.hpp:228

terra::fe::wedge::jac
constexpr dense::Mat< T, 3, 3 > jac(const dense::Vec< T, 3 > &p1_phy, const dense::Vec< T, 3 > &p2_phy, const dense::Vec< T, 3 > &p3_phy, const T r_1, const T r_2, const T xi, const T eta, const T zeta)
Definition integrands.hpp:657

terra::grid::shell::ShellBoundaryFlag::SURFACE
@ SURFACE

terra::grid::shell::ShellBoundaryFlag::CMB
@ CMB

terra::grid::shell::local_domain_md_range_policy_cells
Kokkos::MDRangePolicy< Kokkos::Rank< 4 > > local_domain_md_range_policy_cells(const DistributedDomain &distributed_domain)
Definition spherical_shell.hpp:2739

terra::grid::Grid3DDataVec
Kokkos::View< ScalarType ***[VecDim], Layout > Grid3DDataVec
Definition grid_types.hpp:42

terra::grid::Grid4DDataScalar
Kokkos::View< ScalarType ****, Layout > Grid4DDataScalar
Definition grid_types.hpp:27

terra::grid::Grid2DDataScalar
Kokkos::View< ScalarType **, Layout > Grid2DDataScalar
Definition grid_types.hpp:21

terra::linalg::OperatorApplyMode
OperatorApplyMode
Modes for applying an operator to a vector.
Definition operator.hpp:30

terra::linalg::OperatorApplyMode::Replace
@ Replace
Overwrite the destination vector.

terra::linalg::OperatorCommunicationMode
OperatorCommunicationMode
Modes for communication during operator application.
Definition operator.hpp:40

terra::linalg::OperatorCommunicationMode::CommunicateAdditively
@ CommunicateAdditively
Communicate and add results.

terra::util::has_flag
constexpr bool has_flag(E mask_value, E flag) noexcept
Checks if a bitmask value contains a specific flag.
Definition bit_masking.hpp:43

operator.hpp

spherical_shell.hpp

terra::dense::Vec< ScalarT, 3 >

terra::dense::Vec::dot
T dot(const Vec &other) const
Definition vec.hpp:39

timer.hpp

vec.hpp

vector.hpp

vector_q1.hpp