doxygen/html/functional__qoi_8inl_source.html

 // Copyright (c) 2019-2024, Lawrence Livermore National Security, LLC and

 // other Serac Project Developers. See the top-level LICENSE file for

 // details.

 //

 // SPDX-License-Identifier: (BSD-3-Clause)


 namespace serac {


 struct QoIProlongation {

   QoIProlongation() {}


   QoIProlongation(MPI_Comm c) : comm(c) {}


   void Mult(const mfem::Vector&, mfem::Vector&) const { SLIC_ERROR_ROOT("QoIProlongation::Mult() is not defined"); }


   void MultTranspose(const mfem::Vector& input, mfem::Vector& output) const

   {

     // const_cast to work around clang@14.0.6 compiler error:

     //   "argument type 'const double *' doesn't match specified 'MPI' type tag that requires 'double *'"

     MPI_Allreduce(const_cast<double*>(&input[0]), &output[0], 1, MPI_DOUBLE, MPI_SUM, comm);

   }


   MPI_Comm comm;

 };


 struct QoIElementRestriction {

   void ScatterAdd(const mfem::Vector& input, mfem::Vector& output) const { output[0] += input.Sum(); }

 };


 template <typename... trials, ExecutionSpace exec>

 class Functional<double(trials...), exec> {

   using test = QOI;

   static constexpr tuple<trials...> trial_spaces{};

   static constexpr uint32_t         num_trial_spaces = sizeof...(trials);

   static constexpr auto             Q                = std::max({test::order, trials::order...}) + 1;


   class Gradient;


   // clang-format off

   template <uint32_t i>

   struct operator_paren_return {

     using type = typename std::conditional<

         i == NO_DIFFERENTIATION,          // if `i` is greater than or equal to zero,

         double,                           // wise, we just return the value

         serac::tuple<double&, Gradient&>  // otherwise, we return the value and the derivative w.r.t arg `i`

         >::type;

   };

   // clang-format on


 public:

   Functional(std::array<const mfem::ParFiniteElementSpace*, num_trial_spaces> trial_fes)

       : test_fec_(0, trial_fes[0]->GetMesh()->Dimension()),

         test_space_(dynamic_cast<mfem::ParMesh*>(trial_fes[0]->GetMesh()), &test_fec_),

         trial_space_(trial_fes)

   {

     auto* mesh = trial_fes[0]->GetMesh();


     auto mem_type = mfem::Device::GetMemoryType();


     for (auto type : {Domain::Type::Elements, Domain::Type::BoundaryElements}) {

       input_E_[type].resize(num_trial_spaces);

     }


     for (uint32_t i = 0; i < num_trial_spaces; i++) {

       P_trial_[i] = trial_space_[i]->GetProlongationMatrix();


       input_L_[i].SetSize(P_trial_[i]->Height(), mfem::Device::GetMemoryType());


       for (auto type : {Domain::Type::Elements, Domain::Type::BoundaryElements}) {

         if (type == Domain::Type::Elements) {

           G_trial_[type][i] = BlockElementRestriction(trial_fes[i]);

         } else {

           G_trial_[type][i] = BlockElementRestriction(trial_fes[i], FaceType::BOUNDARY);

         }


         // note: we have to use "Update" here, as mfem::BlockVector's

         // copy assignment ctor (operator=) doesn't let you make changes

         // to the block size

         input_E_[type][i].Update(G_trial_[type][i].bOffsets(), mem_type);

       }

     }


     for (auto type : {Domain::Type::Elements, Domain::Type::BoundaryElements}) {

       std::array<uint32_t, mfem::Geometry::NUM_GEOMETRIES> counts{};

       if (type == Domain::Type::Elements) {

         counts = geometry_counts(*mesh);

       } else {

         counts = boundary_geometry_counts(*mesh);

       }


       mfem::Array<int> offsets(mfem::Geometry::NUM_GEOMETRIES + 1);

       offsets[0] = 0;

       for (int i = 0; i < mfem::Geometry::NUM_GEOMETRIES; i++) {

         auto g         = mfem::Geometry::Type(i);

         offsets[g + 1] = offsets[g] + int(counts[uint32_t(g)]);

       }


       output_E_[type].Update(offsets, mem_type);

     }


     G_test_ = QoIElementRestriction();

     P_test_ = QoIProlongation(trial_fes[0]->GetParMesh()->GetComm());


     output_L_.SetSize(1, mem_type);


     output_T_.SetSize(1, mfem::Device::GetMemoryType());


     // gradient objects depend on some member variables in

     // Functional, so we initialize the gradient objects last

     // to ensure that those member variables are initialized first

     for (uint32_t i = 0; i < num_trial_spaces; i++) {

       grad_.emplace_back(*this, i);

     }

   }


   template <int dim, int... args, typename lambda, typename qpt_data_type = Nothing>

   void AddDomainIntegral(Dimension<dim>, DependsOn<args...>, lambda&& integrand, mfem::Mesh& mesh,

                          std::shared_ptr<QuadratureData<qpt_data_type>> qdata = NoQData)

   {

     if (mesh.GetNE() == 0) return;


     SLIC_ERROR_ROOT_IF(dim != mesh.Dimension(), "invalid mesh dimension for domain integral");


     check_for_unsupported_elements(mesh);

     check_for_missing_nodal_gridfunc(mesh);


     using signature = test(decltype(serac::type<args>(trial_spaces))...);

     integrals_.push_back(

         MakeDomainIntegral<signature, Q, dim>(EntireDomain(mesh), integrand, qdata, std::vector<uint32_t>{args...}));

   }


   template <int dim, int... args, typename lambda, typename qpt_data_type = Nothing>

   void AddDomainIntegral(Dimension<dim>, DependsOn<args...>, lambda&& integrand, Domain& domain,

                          std::shared_ptr<QuadratureData<qpt_data_type>> qdata = NoQData)

   {

     if (domain.mesh_.GetNE() == 0) return;


     SLIC_ERROR_ROOT_IF(dim != domain.mesh_.Dimension(), "invalid mesh dimension for domain integral");


     check_for_unsupported_elements(domain.mesh_);

     check_for_missing_nodal_gridfunc(domain.mesh_);


     using signature = test(decltype(serac::type<args>(trial_spaces))...);

     integrals_.push_back(

         MakeDomainIntegral<signature, Q, dim>(domain, integrand, qdata, std::vector<uint32_t>{args...}));

   }


   template <int dim, int... args, typename lambda, typename qpt_data_type = void>

   void AddBoundaryIntegral(Dimension<dim>, DependsOn<args...>, lambda&& integrand, mfem::Mesh& mesh)

   {

     auto num_bdr_elements = mesh.GetNBE();

     if (num_bdr_elements == 0) return;


     check_for_missing_nodal_gridfunc(mesh);


     using signature = test(decltype(serac::type<args>(trial_spaces))...);

     integrals_.push_back(

         MakeBoundaryIntegral<signature, Q, dim>(EntireBoundary(mesh), integrand, std::vector<uint32_t>{args...}));

   }


   template <int dim, int... args, typename lambda>

   void AddBoundaryIntegral(Dimension<dim>, DependsOn<args...>, lambda&& integrand, const Domain& domain)

   {

     auto num_bdr_elements = domain.mesh_.GetNBE();

     if (num_bdr_elements == 0) return;


     SLIC_ERROR_ROOT_IF(dim != domain.dim_, "invalid domain of integration for boundary integral");


     check_for_missing_nodal_gridfunc(domain.mesh_);


     using signature = test(decltype(serac::type<args>(trial_spaces))...);

     integrals_.push_back(MakeBoundaryIntegral<signature, Q, dim>(domain, integrand, std::vector<uint32_t>{args...}));

   }


   template <int... args, typename lambda, typename qpt_data_type = Nothing>

   void AddAreaIntegral(DependsOn<args...> which_args, lambda&& integrand, mfem::Mesh& domain,

                        std::shared_ptr<QuadratureData<qpt_data_type>>& data = NoQData)

   {

     AddDomainIntegral(Dimension<2>{}, which_args, integrand, domain, data);

   }


   template <int... args, typename lambda, typename qpt_data_type = Nothing>

   void AddVolumeIntegral(DependsOn<args...> which_args, lambda&& integrand, mfem::Mesh& domain,

                          std::shared_ptr<QuadratureData<qpt_data_type>>& data = NoQData)

   {

     AddDomainIntegral(Dimension<3>{}, which_args, integrand, domain, data);

   }


   template <int... args, typename lambda>

   void AddSurfaceIntegral(DependsOn<args...> which_args, lambda&& integrand, mfem::Mesh& domain)

   {

     AddBoundaryIntegral(Dimension<2>{}, which_args, integrand, domain);

   }


   double ActionOfGradient(const mfem::Vector& input_T, uint32_t which) const

   {

     P_trial_[which]->Mult(input_T, input_L_[which]);


     output_L_ = 0.0;


     // this is used to mark when gather operations have been performed,

     // to avoid doing them more than once per trial space

     bool already_computed[Domain::num_types]{};  // default initializes to `false`


     for (auto& integral : integrals_) {

       auto type = integral.domain_.type_;


       if (!already_computed[type]) {

         G_trial_[type][which].Gather(input_L_[which], input_E_[type][which]);

         already_computed[type] = true;

       }


       integral.GradientMult(input_E_[type][which], output_E_[type], which);


       // scatter-add to compute residuals on the local processor

       G_test_.ScatterAdd(output_E_[type], output_L_);

     }


     // scatter-add to compute global residuals

     P_test_.MultTranspose(output_L_, output_T_);


     return output_T_[0];

   }


   template <uint32_t wrt, typename... T>

   typename operator_paren_return<wrt>::type operator()(DifferentiateWRT<wrt>, double t, const T&... args)

   {

     const mfem::Vector* input_T[] = {&static_cast<const mfem::Vector&>(args)...};


     // get the values for each local processor

     for (uint32_t i = 0; i < num_trial_spaces; i++) {

       P_trial_[i]->Mult(*input_T[i], input_L_[i]);

     }


     output_L_ = 0.0;


     // this is used to mark when operations have been performed,

     // to avoid doing them more than once

     bool already_computed[Domain::num_types][num_trial_spaces]{};  // default initializes to `false`


     for (auto& integral : integrals_) {

       auto type = integral.domain_.type_;


       for (auto i : integral.active_trial_spaces_) {

         if (!already_computed[type][i]) {

           G_trial_[type][i].Gather(input_L_[i], input_E_[type][i]);

           already_computed[type][i] = true;

         }

       }


       const bool update_state = false;

       integral.Mult(t, input_E_[type], output_E_[type], wrt, update_state);


       // scatter-add to compute residuals on the local processor

       G_test_.ScatterAdd(output_E_[type], output_L_);

     }


     // scatter-add to compute global residuals

     P_test_.MultTranspose(output_L_, output_T_);


     if constexpr (wrt != NO_DIFFERENTIATION) {

       // if the user has indicated they'd like to evaluate and differentiate w.r.t.

       // a specific argument, then we return both the value and gradient w.r.t. that argument

       //

       // mfem::Vector arg0 = ...;

       // mfem::Vector arg1 = ...;

       // e.g. auto [value, gradient_wrt_arg1] = my_functional(arg0, differentiate_wrt(arg1));

       return {output_T_[0], grad_[wrt]};

     }


     if constexpr (wrt == NO_DIFFERENTIATION) {

       // if the user passes only `mfem::Vector`s then we assume they only want the output value

       //

       // mfem::Vector arg0 = ...;

       // mfem::Vector arg1 = ...;

       // e.g. mfem::Vector value = my_functional(arg0, arg1);

       return output_T_[0];

     }

   }


   template <typename... T>

   auto operator()(double t, const T&... args)

   {

     // below we add 0 so the number of differentiated arguments defaults to 0 if trial spaces are not provided

     constexpr int num_differentiated_arguments = (std::is_same_v<T, differentiate_wrt_this> + ... + 0);

     static_assert(num_differentiated_arguments <= 1,

                   "Error: Functional::operator() can only differentiate w.r.t. 1 argument a time");

     static_assert(sizeof...(T) == num_trial_spaces,

                   "Error: Functional::operator() must take exactly as many arguments as trial spaces");


     [[maybe_unused]] constexpr uint32_t i = index_of_differentiation<T...>();


     return (*this)(DifferentiateWRT<i>{}, t, args...);

   }


 private:

   enum class Operation

   {

     Mult,

     GradientMult

   };


   class Gradient {

   public:

     Gradient(Functional<double(trials...)>& f, uint32_t which = 0)

         : form_(f), which_argument(which), gradient_L_(f.trial_space_[which]->GetVSize())

     {

     }


     void Mult(const mfem::Vector& x, mfem::Vector& y) const { form_.GradientMult(x, y); }


     double operator()(const mfem::Vector& x) const { return form_.ActionOfGradient(x, which_argument); }


     std::unique_ptr<mfem::HypreParVector> assemble()

     {

       // The mfem method ParFiniteElementSpace.NewTrueDofVector should really be marked const

       std::unique_ptr<mfem::HypreParVector> gradient_T(

           const_cast<mfem::ParFiniteElementSpace*>(form_.trial_space_[which_argument])->NewTrueDofVector());


       gradient_L_ = 0.0;


       std::map<mfem::Geometry::Type, ExecArray<double, 3, exec>> element_gradients[Domain::num_types];


       for (auto& integral : form_.integrals_) {

         auto& K_elem             = element_gradients[integral.domain_.type_];

         auto& trial_restrictions = form_.G_trial_[integral.domain_.type_][which_argument].restrictions;


         if (K_elem.empty()) {

           for (auto& [geom, trial_restriction] : trial_restrictions) {

             K_elem[geom] = ExecArray<double, 3, exec>(trial_restriction.num_elements, 1,

                                                       trial_restriction.nodes_per_elem * trial_restriction.components);


             detail::zero_out(K_elem[geom]);

           }

         }


         integral.ComputeElementGradients(K_elem, which_argument);

       }


       for (auto type : {Domain::Type::Elements, Domain::Type::BoundaryElements}) {

         auto& K_elem             = element_gradients[type];

         auto& trial_restrictions = form_.G_trial_[type][which_argument].restrictions;


         if (!K_elem.empty()) {

           for (auto [geom, elem_matrices] : K_elem) {

             std::vector<DoF> trial_vdofs(trial_restrictions[geom].nodes_per_elem * trial_restrictions[geom].components);


             for (axom::IndexType e = 0; e < elem_matrices.shape()[0]; e++) {

               trial_restrictions[geom].GetElementVDofs(e, trial_vdofs);


               // note: elem_matrices.shape()[1] is 1 for a QoI

               for (axom::IndexType i = 0; i < elem_matrices.shape()[1]; i++) {

                 for (axom::IndexType j = 0; j < elem_matrices.shape()[2]; j++) {

                   int sign = trial_vdofs[uint32_t(j)].sign();

                   int col  = int(trial_vdofs[uint32_t(j)].index());

                   gradient_L_[col] += sign * elem_matrices(e, i, j);

                 }

               }

             }

           }

         }

       }


       form_.P_trial_[which_argument]->MultTranspose(gradient_L_, *gradient_T);


       return gradient_T;

     }


     friend auto assemble(Gradient& g) { return g.assemble(); }


   private:

     Functional<double(trials...), exec>& form_;


     uint32_t which_argument;


     mfem::Vector gradient_L_;

   };


   const mfem::L2_FECollection       test_fec_;

   const mfem::ParFiniteElementSpace test_space_;


   std::array<const mfem::ParFiniteElementSpace*, num_trial_spaces> trial_space_;


   const mfem::Operator* P_trial_[num_trial_spaces];


   mutable mfem::Vector input_L_[num_trial_spaces];


   BlockElementRestriction G_trial_[Domain::num_types][num_trial_spaces];


   mutable std::vector<mfem::BlockVector> input_E_[Domain::num_types];


   std::vector<Integral> integrals_;


   mutable mfem::BlockVector output_E_[Domain::num_types];


   QoIElementRestriction G_test_;


   mutable mfem::Vector output_L_;


   QoIProlongation P_test_;


   mutable mfem::Vector output_T_;


   mutable std::vector<Gradient> grad_;

 };


 }  // namespace serac

serac::Functional< double(trials...), exec >::Functional
Functional(std::array< const mfem::ParFiniteElementSpace *, num_trial_spaces > trial_fes)
Constructs using a mfem::ParFiniteElementSpace object corresponding to the trial space.
Definition: functional_qoi.inl:83

serac::Functional< double(trials...), exec >::AddAreaIntegral
void AddAreaIntegral(DependsOn< args... > which_args, lambda &&integrand, mfem::Mesh &domain, std::shared_ptr< QuadratureData< qpt_data_type >> &data=NoQData)
Adds an area integral, i.e., over 2D elements in R^2.
Definition: functional_qoi.inl:242

serac::Functional< double(trials...), exec >::AddVolumeIntegral
void AddVolumeIntegral(DependsOn< args... > which_args, lambda &&integrand, mfem::Mesh &domain, std::shared_ptr< QuadratureData< qpt_data_type >> &data=NoQData)
Adds a volume integral, i.e., over 3D elements in R^3.
Definition: functional_qoi.inl:259

serac::Functional< double(trials...), exec >::AddBoundaryIntegral
void AddBoundaryIntegral(Dimension< dim >, DependsOn< args... >, lambda &&integrand, const Domain &domain)
This is an overloaded member function, provided for convenience. It differs from the above function o...
Definition: functional_qoi.inl:218

serac::Functional< double(trials...), exec >::operator()
auto operator()(double t, const T &... args)
This is an overloaded member function, provided for convenience. It differs from the above function o...
Definition: functional_qoi.inl:380

serac::Functional< double(trials...), exec >::AddDomainIntegral
void AddDomainIntegral(Dimension< dim >, DependsOn< args... >, lambda &&integrand, Domain &domain, std::shared_ptr< QuadratureData< qpt_data_type >> qdata=NoQData)
This is an overloaded member function, provided for convenience. It differs from the above function o...
Definition: functional_qoi.inl:177

serac::Functional< double(trials...), exec >::operator()
operator_paren_return< wrt >::type operator()(DifferentiateWRT< wrt >, double t, const T &... args)
this function lets the user evaluate the serac::Functional with the given trial space values
Definition: functional_qoi.inl:323

serac::Functional< double(trials...), exec >::AddBoundaryIntegral
void AddBoundaryIntegral(Dimension< dim >, DependsOn< args... >, lambda &&integrand, mfem::Mesh &mesh)
Adds a boundary integral term to the Functional object.
Definition: functional_qoi.inl:204

serac::Functional< double(trials...), exec >::AddSurfaceIntegral
void AddSurfaceIntegral(DependsOn< args... > which_args, lambda &&integrand, mfem::Mesh &domain)
alias for Functional::AddBoundaryIntegral(Dimension<2>{}, integrand, domain);
Definition: functional_qoi.inl:267

serac::Functional< double(trials...), exec >::ActionOfGradient
double ActionOfGradient(const mfem::Vector &input_T, uint32_t which) const
this function computes the directional derivative of the quantity of interest functional
Definition: functional_qoi.inl:282

serac::Functional< double(trials...), exec >::AddDomainIntegral
void AddDomainIntegral(Dimension< dim >, DependsOn< args... >, lambda &&integrand, mfem::Mesh &mesh, std::shared_ptr< QuadratureData< qpt_data_type >> qdata=NoQData)
Adds a domain integral term to the Functional object.
Definition: functional_qoi.inl:160

serac
Accelerator functionality.
Definition: serac.cpp:38

serac::EntireBoundary
Domain EntireBoundary(const mfem::Mesh &mesh)
constructs a domain from all the boundary elements in a mesh
Definition: domain.cpp:418

serac::NoQData
std::shared_ptr< QuadratureData< Nothing > > NoQData
a single instance of a QuadratureData container of Nothings, since they are all interchangeable
Definition: quadrature_data.cpp:18

serac::max
SERAC_HOST_DEVICE auto max(dual< gradient_type > a, double b)
Implementation of max for dual numbers.
Definition: dual.hpp:230

serac::check_for_missing_nodal_gridfunc
void check_for_missing_nodal_gridfunc(const mfem::Mesh &mesh)
function for verifying that the mesh has been fully initialized
Definition: functional.hpp:73

serac::index_of_differentiation
constexpr uint32_t index_of_differentiation()
given a list of types, this function returns the index that corresponds to the type dual_vector.
Definition: functional.hpp:49

serac::boundary_geometry_counts
std::array< uint32_t, mfem::Geometry::NUM_GEOMETRIES > boundary_geometry_counts(const mfem::Mesh &mesh)
count the number of boundary elements of each geometry in a mesh
Definition: geometry.hpp:83

serac::type
constexpr SERAC_HOST_DEVICE auto type(const tuple< T... > &values)
a function intended to be used for extracting the ith type from a tuple.
Definition: tuple.hpp:274

serac::ExecutionSpace
ExecutionSpace
enum used for signalling whether or not to perform certain calculations on the CPU or GPU
Definition: accelerator.hpp:69

serac::check_for_unsupported_elements
void check_for_unsupported_elements(const mfem::Mesh &mesh)
function for verifying that there are no unsupported element types in the mesh
Definition: functional.hpp:82

serac::EntireDomain
Domain EntireDomain(const mfem::Mesh &mesh)
constructs a domain from all the elements in a mesh
Definition: domain.cpp:382

serac::geometry_counts
std::array< uint32_t, mfem::Geometry::NUM_GEOMETRIES > geometry_counts(const mfem::Mesh &mesh)
count the number of elements of each geometry in a mesh
Definition: geometry.hpp:70

serac::BlockElementRestriction
a generalization of mfem::ElementRestriction that works with multiple kinds of element geometries....
Definition: element_restriction.hpp:209

serac::DependsOn
Definition: functional.hpp:35

serac::DifferentiateWRT
Definition: differentiate_wrt.hpp:15

serac::Dimension
Compile-time alias for a dimension.
Definition: geometry.hpp:11

serac::Domain
a class for representing a geometric region that can be used for integration
Definition: domain.hpp:21

serac::Domain::num_types
static constexpr int num_types
the number of entries in the Type enum
Definition: domain.hpp:29

serac::Domain::dim_
int dim_
the geometric dimension of the domain
Definition: domain.hpp:35

serac::Domain::mesh_
const mfem::Mesh & mesh_
the underyling mesh for this domain
Definition: domain.hpp:32

serac::Nothing
these classes are a little confusing. These two special types represent the similar (but different) c...
Definition: quadrature_data.hpp:38

serac::QOI
"Quantity of Interest" elements (i.e. elements with a single shape function, 1)
Definition: finite_element.hpp:229

serac::QoIElementRestriction
this class behaves like a Restriction operator, except is specialized for the case of a quantity of i...
Definition: functional_qoi.inl:45

serac::QoIElementRestriction::ScatterAdd
void ScatterAdd(const mfem::Vector &input, mfem::Vector &output) const
element-to-global ScatterAdd operation used in FEM assembly, for quantities of interest
Definition: functional_qoi.inl:52

serac::QoIProlongation
this class behaves like a Prolongation operator, except is specialized for the case of a quantity of ...
Definition: functional_qoi.inl:20

serac::QoIProlongation::MultTranspose
void MultTranspose(const mfem::Vector &input, mfem::Vector &output) const
set the value of output to the distributed sum over input values from different processors
Definition: functional_qoi.inl:30

serac::QoIProlongation::QoIProlongation
QoIProlongation(MPI_Comm c)
create a QoIProlongation for a Quantity of Interest
Definition: functional_qoi.inl:24

serac::QoIProlongation::comm
MPI_Comm comm
MPI communicator used to carry out the distributed reduction.
Definition: functional_qoi.inl:37

serac::QoIProlongation::Mult
void Mult(const mfem::Vector &, mfem::Vector &) const
unimplemented: do not use
Definition: functional_qoi.inl:27

serac::QuadratureData
A class for storing and access user-defined types at quadrature points.
Definition: quadrature_data.hpp:112

serac::tuple
This is a class that mimics most of std::tuple's interface, except that it is usable in CUDA kernels ...
Definition: tuple.hpp:28