// next/Op__Dift__VEF__Face__Gen_8tpp_source.html

/****************************************************************************

* Copyright (c) 2025, CEA

* All rights reserved.

*

* Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met:

* 1. Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer.

* 2. Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution.

* 3. Neither the name of the copyright holder nor the names of its contributors may be used to endorse or promote products derived from this software without specific prior written permission.

*

* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.

* IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;

* OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

*

*****************************************************************************/


#ifndef Op_Dift_VEF_Face_Gen_TPP_included

#define Op_Dift_VEF_Face_Gen_TPP_included


#include <Modele_turbulence_scal_base.h>

#include <Echange_externe_impose.h>

#include <Scalaire_impose_paroi.h>

#include <Neumann_sortie_libre.h>

#include <Op_Diff_VEF_base.h>

#include <Neumann_homogene.h>

#include <Neumann_paroi.h>

#include <Periodique.h>

#include <Champ_P1NC.h>

#include <Symetrie.h>

#include <Device.h>

#include <kokkos++.h>

#include <TRUSTArray_kokkos.tpp>


/*! @brief Fills the element-wise gradient grad_ and the tensor Re_ used by the vectorial operator.
 *
 * Nothing is done unless _TYPE_ is Type_Champ::VECTORIEL. Otherwise:
 *  - grad_ is sized on first use, zeroed, computed by Champ_P1NC::calcul_gradient and, when the
 *    turbulence model uses a wall law, corrected by Champ_P1NC::calcul_duidxj_paroi;
 *  - Re_ is sized on first use, zeroed and handed to the turbulence model's calcul_tenseur_Re();
 *    when that call returns true Re_ is multiplied by nu_turb, otherwise it is overwritten with
 *    nu_turb * (grad + grad^T).
 * Both arrays have their virtual space exchanged after being filled.
 *
 * @param tab_inconnue unknown handed to the gradient computation
 * @param tab_resu     only its line_size() is read (number of components)
 * @param tab_nu       handed to calcul_duidxj_paroi
 * @param tab_nu_turb  turbulent viscosity; column 0 is read for each element
 */
template <typename DERIVED_T> template <Type_Champ _TYPE_>
void Op_Dift_VEF_Face_Gen<DERIVED_T>::fill_grad_Re(const DoubleTab& tab_inconnue, const DoubleTab& tab_resu, const DoubleTab& tab_nu, const DoubleTab& tab_nu_turb) const
{
  constexpr bool is_VECT = (_TYPE_ == Type_Champ::VECTORIEL);
  if (!is_VECT)
    return; // only the vectorial operator needs grad_ and Re_

  const auto *derived = static_cast<const DERIVED_T*>(this); // CRTP downcast
  const Domaine_Cl_VEF& dom_cl = derived->domaine_cl_vef();
  const Domaine_VEF& dom = derived->domaine_vef();

  // Gives an array that has no MD vector yet its (element, dimension, dimension) layout
  auto shape_as_elem_tensor = [&dom](auto& tensor)
  {
    if (tensor.get_md_vector().non_nul())
      return;
    tensor.resize(0, Objet_U::dimension, Objet_U::dimension);
    dom.domaine().creer_tableau_elements(tensor);
  };

  // --- gradient of the unknown ---
  shape_as_elem_tensor(grad_);
  grad_ = 0.;
  Champ_P1NC::calcul_gradient(tab_inconnue, grad_, dom_cl);
  if (derived->get_modele_turbulence().utiliser_loi_paroi())
    Champ_P1NC::calcul_duidxj_paroi(grad_, tab_nu, tab_nu_turb, derived->get_tau_tan(), dom_cl);
  grad_.echange_espace_virtuel();

  // --- tensor Re_ ---
  shape_as_elem_tensor(Re_);
  Re_ = 0.;
  const bool tensor_from_model = derived->get_modele_turbulence().calcul_tenseur_Re(tab_nu_turb, grad_, Re_);

  const int nbr_comp = tab_resu.line_size();
  assert(nbr_comp > 1);
  const int nb_elem = dom.nb_elem();
  CDoubleTabView nu_turb = tab_nu_turb.view_ro();
  DoubleTabView3 Re = Re_.view_rw<3>();

  if (tensor_from_model)
    {
      // The model filled Re_: scale every entry by the turbulent viscosity of its element
      Cerr << "Using non-linear turbulent diffusion in NS" << finl;
      Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__), range_2D({0,0}, {nb_elem,nbr_comp}), KOKKOS_LAMBDA(const int elem, const int row)
      {
        const double nut = nu_turb(elem, 0);
        for (int col = 0; col < nbr_comp; col++)
          Re(elem, row, col) *= nut;
      });
    }
  else
    {
      // Default closure: Re = nu_turb * (grad + grad^T)
      CDoubleTabView3 grad = grad_.view_ro<3>();
      // PL: range_3D is slower than range_2D, hence the inner loop over the last index
      Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__), range_2D({0,0}, {nb_elem,nbr_comp}), KOKKOS_LAMBDA(const int elem, const int row)
      {
        const double nut = nu_turb(elem, 0);
        for (int col = 0; col < nbr_comp; col++)
          Re(elem, row, col) = nut * (grad(elem, row, col) + grad(elem, col, row));
      });
    }
  end_gpu_timer(__KERNEL_NAME__);
  Re_.echange_espace_virtuel();
}


/*

 * ***************************

 *  METHODS FOR THE EXPLICIT SCHEME

 * ***************************

 */


/*! @brief Explicit boundary-face contribution of the vectorial operator.
 *
 * For every boundary condition, the flux
 *   face_normale(face, j) * (nu(elem, 0) * grad_(elem, i, j) + Re_(elem, i, j))
 * is subtracted from tab_resu on the boundary faces:
 *  - periodic boundaries: both neighbouring elements contribute, with opposite signs;
 *  - other boundaries: only neighbour 0 contributes and the same flux is also subtracted
 *    from tab_flux_bords.
 * grad_ and Re_ are read as they currently are (see fill_grad_Re).
 *
 * @param tab_inconnue    not read by this overload
 * @param tab_resu        residual, updated in place on boundary faces
 * @param tab_flux_bords  boundary fluxes, updated in place on non-periodic boundaries
 * @param tab_nu          viscosity, column 0 is read per element
 * @param tab_nu_turb     not read by this overload
 */
template <typename DERIVED_T> template<Type_Champ _TYPE_, bool _IS_RANS_>
std::enable_if_t<_TYPE_ == Type_Champ::VECTORIEL, void>
Op_Dift_VEF_Face_Gen<DERIVED_T>::ajouter_bord_gen(const DoubleTab& tab_inconnue, DoubleTab& tab_resu, DoubleTab& tab_flux_bords, const DoubleTab& tab_nu, const DoubleTab& tab_nu_turb) const
{
  // Kokkos tip: rename the TRUST tabs (e.g. the parameters) and use the plain name for the view: it limits code changes.
  // Future: parameters will be views, not TRUST arrays, and it will be easier to refactor by find/replace "const DoubleTab& tab_XXX" by "CDoubleTabView XXX"
  const auto *z_class = static_cast<const DERIVED_T*>(this); // CRTP downcast

  const Domaine_Cl_VEF& domaine_Cl_VEF = z_class->domaine_cl_vef();
  const Domaine_VEF& domaine_VEF = z_class->domaine_vef();
  const int nbr_comp = tab_resu.line_size();

  // loop over boundary conditions
  const Conds_lim& les_cl = domaine_Cl_VEF.les_conditions_limites();
  const int nb_cl = les_cl.size();
  CIntTabView face_voisins = domaine_VEF.face_voisins().view_ro();
  CDoubleTabView face_normale = domaine_VEF.face_normales().view_ro();
  CDoubleTabView nu = tab_nu.view_ro();
  CDoubleTabView3 Re = Re_.view_ro<3>();
  CDoubleTabView3 grad = grad_.view_ro<3>();
  DoubleTabView flux_bords = tab_flux_bords.view_rw();
  DoubleTabView resu = tab_resu.view_rw();
  for (int n_bord = 0; n_bord < nb_cl; n_bord++)
    {
      const Cond_lim& la_cl = domaine_Cl_VEF.les_conditions_limites(n_bord);
      const Front_VF& le_bord = ref_cast(Front_VF, la_cl->frontiere_dis());
      const int ndeb = le_bord.num_premiere_face(), nfin = ndeb + le_bord.nb_faces();

      if (sub_type(Periodique, la_cl.valeur()))
        Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__),
                             Kokkos::RangePolicy<>(ndeb, nfin), KOKKOS_LAMBDA(
                               const int num_face)
        {
          // Both neighbours contribute; ori is +1 for neighbour 0 and -1 for neighbour 1
          for (int kk = 0; kk < 2; kk++)
            {
              const int elem = face_voisins(num_face, kk), ori = 1 - 2 * kk;
              for (int i = 0; i < nbr_comp; i++)
                for (int j = 0; j < nbr_comp; j++)
                  resu(num_face, i) -=
                    ori * face_normale(num_face, j) * (nu(elem, 0) * grad(elem, i, j) + Re(elem, i, j));
            }
        });
      else // non-periodic BC
        {
          // Deliberately NOT named "Symetrie": a local with that name would hide the class
          // inside its own initializer and make the test depend on how sub_type expands.
          const bool is_symetrie = sub_type(Symetrie, la_cl.valeur());
          Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__),
                               Kokkos::RangePolicy<>(ndeb, nfin), KOKKOS_LAMBDA(
                                 const int num_face)
          {
            const int elem = face_voisins(num_face, 0);
            for (int i = 0; i < nbr_comp; i++)
              for (int j = 0; j < nbr_comp; j++)
                {
                  double flux = face_normale(num_face, j) * (nu(elem, 0) * grad(elem, i, j) + Re(elem, i, j));
                  resu(num_face, i) -= flux;
                  flux_bords(num_face, i) -= flux;
                }

            // Correction of tab_flux_bords for symmetry
            // NOTE(review): only component 0 is reset here - confirm the other components are meant to keep their value.
            if (is_symetrie)
              flux_bords(num_face, 0) = 0.;
          });
        }
      end_gpu_timer(__KERNEL_NAME__);
    }
}


// Plain aggregate bundling what the interior-face kernels (apply_ajouter_interne_gen_kernel*)
// read and write. It is brace-initialised by position, so the member order must not change.
struct AjouterInterneData
{
  // Face range [nint, nb_faces) over which the kernels iterate
  int nint;
  int nb_faces;

  // Read-only inputs
  CIntTabView        face_voisins;  // indexed (face, side) with side in {0, 1}; yields an element index
  CDoubleTabView     face_normale;  // indexed (face, component)
  CDoubleArrView     nu;            // indexed (element)
  CDoubleTabView3    Re;            // indexed (element, i, j)
  CDoubleTabView3    grad;          // indexed (element, i, j)

  // Output, accumulated into by the kernels
  DoubleTabView      resu;          // indexed (face, component)
};


inline void apply_ajouter_interne_gen_kernel_notemplate(const AjouterInterneData& data, const int nbr_comp)

{

  // Unpack on host side BEFORE passing to kernel

  const int nint         = data.nint;

  const int nb_faces     = data.nb_faces;

  auto face_voisins      = data.face_voisins;

  auto face_normale      = data.face_normale;

  auto nu                = data.nu;

  auto Re                = data.Re;

  auto grad              = data.grad;

  auto resu              = data.resu;


  // PL: collapsing loops even with an atomic is x2-3 faster than no collapsing (seen on DomainFlowLES_BENCH)

  bool collapse_loops = true;

  if (collapse_loops)

    {

      Kokkos::MDRangePolicy<Kokkos::Rank<2>> policy({nint, 0}, {nb_faces, 2});

      Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__), policy, KOKKOS_LAMBDA(const int num_face, const int kk)

      {

        const int elem = face_voisins(num_face, kk), ori = 1 - 2 * kk;

        double nu_elem = nu(elem);

        for (int i = 0; i < nbr_comp; i++)

          for (int j = 0; j < nbr_comp; j++)

            Kokkos::atomic_add(&resu(num_face, i), - ori * face_normale(num_face, j) * (nu_elem * grad(elem, i, j) + Re(elem, i, j)));

      });

    }

  else

    {

      Kokkos::RangePolicy<> policy(nint, nb_faces);

      Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__), policy, KOKKOS_LAMBDA(

                             const int num_face)

      {

        for (int kk = 0; kk < 2; kk++)

          {

            const int elem = face_voisins(num_face, kk), ori = 1 - 2 * kk;

            double nu_elem = nu(elem);

            for (int i = 0; i < nbr_comp; i++)

              for (int j = 0; j < nbr_comp; j++)

                resu(num_face, i) -=

                  ori * face_normale(num_face, j) * (nu_elem * grad(elem, i, j) + Re(elem, i, j));

          }

      });

    }

  end_gpu_timer(__KERNEL_NAME__);

}


template<int nbr_comp>

void apply_ajouter_interne_gen_kernel(const AjouterInterneData& data)

{

  // Unpack on host side BEFORE passing to kernel

  const int nint         = data.nint;

  const int nb_faces     = data.nb_faces;

  auto face_voisins      = data.face_voisins;

  auto face_normale      = data.face_normale;

  auto nu                = data.nu;

  auto Re                = data.Re;

  auto grad              = data.grad;

  auto resu              = data.resu;


  // Deduce policy

  Kokkos::RangePolicy<> policy(nint, nb_faces);


  Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__), policy,

                       KOKKOS_LAMBDA(const int num_face)

  {

    double resu_loc[2][nbr_comp];

    double face_normale_loc[nbr_comp];

    int    face_voisins_loc[2];


    // Load per-face data from global memory once

    for (int j = 0; j < nbr_comp; ++j)

      face_normale_loc[j] = face_normale(num_face, j);


    for (int side = 0; side < 2; ++side)

      {

        face_voisins_loc[side] = face_voisins(num_face, side);

        for (int i = 0; i < nbr_comp; ++i) resu_loc[side][i] = 0.0;

      }


    // Compute local contributions

    for (int side = 0; side < 2; ++side)

      {

        const int elem = face_voisins_loc[side];

        const int ori  = 1 - 2 * side;

        const double nu_elem = nu(elem);


        for (int i = 0; i < nbr_comp; ++i)

          {

            double sum = 0.0;

            for (int j = 0; j < nbr_comp; ++j)

              {

                sum -= ori * face_normale_loc[j]

                       * (nu_elem * grad(elem, i, j) + Re(elem, i, j));

              }

            resu_loc[side][i] += sum;

          }

      }


    // Reduce two sides and write back

    for (int i = 0; i < nbr_comp; ++i)

      {

        double sum = 0.0;

        for (int side = 0; side < 2; ++side) sum += resu_loc[side][i];

        resu(num_face, i) += sum;

      }

  });


  end_gpu_timer(__KERNEL_NAME__);

}


// Explicit instantiation definitions of apply_ajouter_interne_gen_kernel for the component
// counts 1 to 4, i.e. the values dispatched by the switch in ajouter_interne_gen.
// NOTE(review): this file is protected by an include guard and looks meant to be included;
// if it ends up in several translation units, each of them will carry these explicit
// instantiation definitions - confirm this is intended (the switch alone already triggers
// implicit instantiation).

template void apply_ajouter_interne_gen_kernel<1>(const AjouterInterneData&);

template void apply_ajouter_interne_gen_kernel<2>(const AjouterInterneData&);

template void apply_ajouter_interne_gen_kernel<3>(const AjouterInterneData&);

template void apply_ajouter_interne_gen_kernel<4>(const AjouterInterneData&);


/*! @brief Explicit interior-face contribution of the vectorial operator.
 *
 * Builds the views over the face connectivity, face normals, viscosity, grad_ and Re_, packs
 * them in an AjouterInterneData and runs the interior-face kernel on the face range
 * [premiere_face_int(), nb_faces()). The kernel specialised on the component count is used for
 * 1 to 4 components; any other count falls back to the run-time-sized kernel.
 *
 * @param tab_inconnue not read by this overload
 * @param tab_resu     residual, accumulated into on interior faces
 * @param flux_bords   not read by this overload
 * @param tab_nu       viscosity, viewed as a flat array indexed by element
 * @param tab_nu_turb  not read by this overload
 */
template <typename DERIVED_T> template<Type_Champ _TYPE_, bool _IS_RANS_>
std::enable_if_t<_TYPE_ == Type_Champ::VECTORIEL, void>
Op_Dift_VEF_Face_Gen<DERIVED_T>::ajouter_interne_gen(const DoubleTab& tab_inconnue,
                                                     DoubleTab& tab_resu,
                                                     DoubleTab& flux_bords,
                                                     const DoubleTab& tab_nu,
                                                     const DoubleTab& tab_nu_turb) const
{
  const Domaine_VEF& domaine_VEF = static_cast<const DERIVED_T*>(this)->domaine_vef();
  const int nb_faces = domaine_VEF.nb_faces();
  const int nint     = domaine_VEF.premiere_face_int();
  const int nbr_comp = tab_resu.line_size();

  // Build views once
  CIntTabView     face_voisins = domaine_VEF.face_voisins().view_ro();
  CDoubleTabView  face_normale = domaine_VEF.face_normales().view_ro();
  CDoubleArrView  nu           = static_cast<const ArrOfDouble&>(tab_nu).view_ro();
  CDoubleTabView3 grad         = grad_.view_ro<3>();
  CDoubleTabView3 Re           = Re_.view_ro<3>();
  DoubleTabView   resu         = tab_resu.view_rw();
  // Positional initialisation: the order must match the member order of AjouterInterneData
  AjouterInterneData data {nint, nb_faces, face_voisins, face_normale, nu, Re, grad, resu};

  // You might not want to use the templated version for HUGE values of nbr_comp
  const bool use_templated_version=true;

  // Dispatch on compile-time component count
  if (use_templated_version)
    {
      switch (nbr_comp)
        {
        case 1:
          apply_ajouter_interne_gen_kernel<1>(data);
          break;
        case 2:
          apply_ajouter_interne_gen_kernel<2>(data);
          break;
        case 3:
          apply_ajouter_interne_gen_kernel<3>(data);
          break;
        case 4:
          apply_ajouter_interne_gen_kernel<4>(data);
          break;
        default:
          // No specialisation available: warn (each message terminated by finl) and use the generic kernel
          Cerr << "nbr_comp too large (>4), no templated version of Op_Dift_VEF_Face_Gen<DERIVED_T>::ajouter_interne_gen implemented" << finl;
          Cerr << "Defaulting to the non templated version." << finl;
          apply_ajouter_interne_gen_kernel_notemplate(data, nbr_comp);
          break;
        }
    }
  else
    {
      apply_ajouter_interne_gen_kernel_notemplate(data, nbr_comp);
    }
}


/*! @brief Explicit boundary-face contribution of the scalar operator.
 *
 * Walks over the boundary conditions and delegates to the generic helpers with
 * Type_Schema::EXPLICITE and no stabilisation:
 *  - periodic boundary: ajouter_bord_perio_gen__;
 *  - Scalaire_impose_paroi, Neumann_paroi or Neumann_homogene: ajouter_bord_scalaire_impose_gen__,
 *    followed by ajouter_bord_gen__;
 *  - any other boundary: ajouter_bord_gen__ only.
 * modifie_pour_cl_gen<false> is applied once all boundaries have been processed.
 * nu_turb is passed a second time to the helpers as a placeholder for their porosity argument.
 */
template <typename DERIVED_T> template<Type_Champ _TYPE_, bool _IS_RANS_>
std::enable_if_t<_TYPE_ == Type_Champ::SCALAIRE, void>
Op_Dift_VEF_Face_Gen<DERIVED_T>::ajouter_bord_gen(const DoubleTab& inconnue, DoubleTab& resu, DoubleTab& tab_flux_bords, const DoubleTab& nu, const DoubleTab& nu_turb) const
{
  const auto *derived = static_cast<const DERIVED_T*>(this); // CRTP downcast
  const Domaine_Cl_VEF& dom_cl = derived->domaine_cl_vef();
  const Domaine_VEF& dom = derived->domaine_vef();
  const int nb_front = dom.nb_front_Cl();

  for (int n_bord = 0; n_bord < nb_front; ++n_bord)
    {
      const Cond_lim& la_cl = dom_cl.les_conditions_limites(n_bord);
      const Cond_lim_base& cl = la_cl.valeur();

      if (sub_type(Periodique, cl))
        {
          ajouter_bord_perio_gen__<_TYPE_, Type_Schema::EXPLICITE, false, _IS_RANS_>(n_bord, inconnue, &resu, nullptr, nu, nu_turb, nu_turb /* scratch */);
          continue;
        }

      // Non-periodic boundary: these three kinds get the extra helper call first
      const bool needs_scalaire_impose = sub_type(Scalaire_impose_paroi, cl) || sub_type(Neumann_paroi, cl) || sub_type(Neumann_homogene, cl);
      if (needs_scalaire_impose)
        ajouter_bord_scalaire_impose_gen__<_TYPE_, Type_Schema::EXPLICITE, false>(n_bord, inconnue, &resu, nullptr, nu, nu_turb, nu_turb /* scratch */, &tab_flux_bords);

      // Always applied on non-periodic boundaries
      ajouter_bord_gen__<_TYPE_, Type_Schema::EXPLICITE, false, _IS_RANS_>(n_bord, inconnue, &resu, nullptr, nu, nu_turb, nu_turb /* scratch */, &tab_flux_bords);
    }

  modifie_pour_cl_gen<false>(inconnue, resu, tab_flux_bords);
}


/*! @brief Adjusts the residual and the boundary fluxes according to the type of each boundary condition.
 *
 * For every boundary, the following independent tests are made in this order:
 *  - Periodique (only when _IS_STAB_): for the first half of the boundary faces, the residuals of
 *    a face and of its associated face are summed and the sum is stored on both;
 *  - Neumann_paroi: flux = flux_impose * face_surfaces;
 *  - Echange_externe_impose: flux = h_imp * (T_ext - inconnue) * face_surfaces;
 *    in both cases the flux is subtracted from (_IS_STAB_) or added to (otherwise) the residual,
 *    and stored in tab_flux_bords;
 *  - Neumann_homogene, Symetrie or Neumann_sortie_libre: tab_flux_bords is set to zero.
 *
 * @param tab_inconnue   unknown, read on Echange_externe_impose boundaries
 * @param tab_resu       residual, updated in place
 * @param tab_flux_bords boundary fluxes, overwritten on the boundaries listed above
 */
template <typename DERIVED_T> template <bool _IS_STAB_>
void Op_Dift_VEF_Face_Gen<DERIVED_T>::modifie_pour_cl_gen(const DoubleTab& tab_inconnue, DoubleTab& tab_resu, DoubleTab& tab_flux_bords) const
{
  constexpr bool is_STAB = _IS_STAB_;
  const auto *derived = static_cast<const DERIVED_T*>(this); // CRTP downcast

  const Domaine_Cl_VEF& dom_cl = derived->domaine_cl_vef();
  const Domaine_VEF& dom = derived->domaine_vef();
  const int nb_front = dom.nb_front_Cl();
  const int nb_comp = tab_resu.line_size();

  for (int n_bord = 0; n_bord < nb_front; ++n_bord)
    {
      const Cond_lim& la_cl = dom_cl.les_conditions_limites(n_bord);
      const Cond_lim_base& cl = la_cl.valeur();
      const Front_VF& le_bord = ref_cast(Front_VF, la_cl->frontiere_dis());
      const int ndeb = le_bord.num_premiere_face();
      const int nfin = ndeb + le_bord.nb_faces();

      // --- periodic boundary (stabilised operator only) ---
      if (is_STAB && sub_type(Periodique, cl))
        {
          const Periodique& perio = ref_cast(Periodique, cl);
          CIntArrView face_associee = perio.face_associee().view_ro();
          CIntArrView bord_faces = le_bord.num_face().view_ro();
          DoubleTabView resu = tab_resu.view_rw();
          Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__), Kokkos::RangePolicy<>(0, le_bord.nb_faces()/2), KOKKOS_LAMBDA(const int ind_face)
          {
            const int face = bord_faces(ind_face);
            const int twin = bord_faces(face_associee(ind_face));
            for (int nc = 0; nc < nb_comp; nc++)
              {
                // Same value on both faces of the periodic pair
                const double total = resu(face, nc) + resu(twin, nc);
                resu(face, nc) = total;
                resu(twin, nc) = total;
              }
          });
          end_gpu_timer(__KERNEL_NAME__);
        }

      // --- imposed wall flux ---
      if (sub_type(Neumann_paroi, cl))
        {
          const Neumann_paroi& paroi = ref_cast(Neumann_paroi, cl);
          CDoubleTabView flux_impose = paroi.flux_impose().view_ro();
          CDoubleArrView face_surfaces = dom.face_surfaces().view_ro();
          DoubleTabView flux_bords = tab_flux_bords.view_wo();
          DoubleTabView resu = tab_resu.view_rw();
          Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__), Kokkos::RangePolicy<>(ndeb, nfin), KOKKOS_LAMBDA(const int face)
          {
            const int face_loc = face - ndeb; // index local to the boundary
            for (int nc = 0; nc < nb_comp; nc++)
              {
                const double flux = flux_impose(face_loc, nc) * face_surfaces(face);
                // XXX: "-=" for the stabilised operator, see Op_Dift_Stab_VEF_Face::ajouter
                if (is_STAB)
                  resu(face, nc) -= flux;
                else
                  resu(face, nc) += flux;
                flux_bords(face, nc) = flux;
              }
          });
          end_gpu_timer(__KERNEL_NAME__);
        }

      // --- imposed external exchange ---
      if (sub_type(Echange_externe_impose, cl))
        {
          const Echange_externe_impose& echange = ref_cast(Echange_externe_impose, cl);
          CDoubleTabView h_imp = echange.tab_h_imp().view_ro();
          CDoubleTabView T_ext = echange.tab_T_ext().view_ro();
          CDoubleArrView face_surfaces = dom.face_surfaces().view_ro();
          CDoubleTabView inconnue = tab_inconnue.view_ro();
          DoubleTabView flux_bords = tab_flux_bords.view_wo();
          DoubleTabView resu = tab_resu.view_rw();
          Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__), Kokkos::RangePolicy<>(ndeb, nfin), KOKKOS_LAMBDA(const int face)
          {
            const int face_loc = face - ndeb; // index local to the boundary
            for (int nc = 0; nc < nb_comp; nc++)
              {
                const double flux = h_imp(face_loc, nc) * (T_ext(face_loc, nc) - inconnue(face, nc)) * face_surfaces(face);
                if (is_STAB)
                  resu(face, nc) -= flux;
                else
                  resu(face, nc) += flux;
                flux_bords(face, nc) = flux;
              }
          });
          end_gpu_timer(__KERNEL_NAME__);
        }

      // --- boundaries whose reported flux is zero ---
      const bool zero_flux = sub_type(Neumann_homogene, cl) || sub_type(Symetrie, cl) || sub_type(Neumann_sortie_libre, cl);
      if (zero_flux)
        {
          DoubleTabView flux_bords = tab_flux_bords.view_wo();
          Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__), Kokkos::RangePolicy<>(ndeb, nfin), KOKKOS_LAMBDA(const int face)
          {
            for (int nc = 0; nc < nb_comp; nc++)
              flux_bords(face, nc) = 0.;
          });
          end_gpu_timer(__KERNEL_NAME__);
        }
    }
}


/*

 * ***************************

 *  METHODS FOR THE IMPLICIT SCHEME

 * ***************************

 */

/*! @brief Implicit (matrix) boundary-face contribution.
 *
 * Walks over the boundary conditions and delegates to the generic helpers with
 * Type_Schema::IMPLICITE:
 *  - periodic boundary: ajouter_bord_perio_gen__;
 *  - Scalaire_impose_paroi: ajouter_bord_scalaire_impose_gen__, then ajouter_bord_gen__;
 *  - Echange_externe_impose with a single component: h_imp(face, 0) * face_surfaces(face) is
 *    added to the diagonal coefficient of each boundary face, then ajouter_bord_gen__;
 *  - any other boundary: ajouter_bord_gen__ only.
 *
 * @param transporte          transported unknown; its line_size() gives the component count
 * @param tab_matrice         matrix updated in place
 * @param nu, nu_turb         viscosities forwarded to the helpers
 * @param porosite_eventuelle forwarded to the helpers
 */
template <typename DERIVED_T> template <Type_Champ _TYPE_, bool _IS_STAB_, bool _IS_RANS_>
void Op_Dift_VEF_Face_Gen<DERIVED_T>::ajouter_contribution_bord_gen(const DoubleTab& transporte, Matrice_Morse& tab_matrice, const DoubleTab& nu,
                                                                    const DoubleTab& nu_turb, const DoubleVect& porosite_eventuelle) const
{
  const auto *derived = static_cast<const DERIVED_T*>(this); // CRTP downcast

  const Domaine_Cl_VEF& dom_cl = derived->domaine_cl_vef();
  const Domaine_VEF& dom = derived->domaine_vef();
  const int nb_bords = dom.nb_front_Cl();
  const int nb_comp = transporte.line_size();

  for (int n_bord = 0; n_bord < nb_bords; ++n_bord)
    {
      const Cond_lim& la_cl = dom_cl.les_conditions_limites(n_bord);
      const Cond_lim_base& cl = la_cl.valeur();
      const Front_VF& le_bord = ref_cast(Front_VF, la_cl->frontiere_dis());

      if (sub_type(Periodique, cl))
        {
          ajouter_bord_perio_gen__<_TYPE_, Type_Schema::IMPLICITE, _IS_STAB_, _IS_RANS_>(n_bord, transporte, nullptr, &tab_matrice, nu, nu_turb, porosite_eventuelle);
          continue;
        }

      // Non-periodic boundary
      if (sub_type(Scalaire_impose_paroi, cl))
        {
          ajouter_bord_scalaire_impose_gen__<_TYPE_, Type_Schema::IMPLICITE, _IS_STAB_>(n_bord, transporte, nullptr, &tab_matrice, nu, nu_turb, porosite_eventuelle);
        }
      else if (sub_type(Echange_externe_impose, cl) && nb_comp < 2) // XXX: later for multi-unknown too ...
        {
          const Echange_externe_impose& echange = ref_cast(Echange_externe_impose, cl);
          const int ndeb = le_bord.num_premiere_face();
          const int nfin = ndeb + le_bord.nb_faces();
          Matrice_Morse_View matrice;
          matrice.set(tab_matrice);
          CDoubleTabView h_imp = echange.tab_h_imp().view_ro();
          CDoubleArrView face_surfaces = dom.face_surfaces().view_ro();
          Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__), Kokkos::RangePolicy<>(ndeb, nfin), KOKKOS_LAMBDA(const int face)
          {
            // Diagonal term only; h_imp is indexed locally to the boundary
            matrice.add(face, face, h_imp(face - ndeb, 0) * face_surfaces(face));
          });
          end_gpu_timer(__KERNEL_NAME__);
        }

      // Always applied on non-periodic boundaries
      ajouter_bord_gen__<_TYPE_, Type_Schema::IMPLICITE, _IS_STAB_, _IS_RANS_>(n_bord, transporte, nullptr, &tab_matrice, nu, nu_turb, porosite_eventuelle);
    }
}


// GENERIC METHODS

/*! @brief Contribution of one periodic boundary, for the explicit (residual) or implicit (matrix) scheme.
 *
 * For each processed boundary face num_face0 and each of its two neighbouring elements, the faces j
 * of that element with j > num_face0 are visited and the coefficient
 * valA = viscA(num_face0, j, elem, nu + nu_turb, ...) is used:
 *  - explicit scheme (faces j equal to the associated periodic face are skipped):
 *    flux = valA * (inconnue(j) - inconnue(num_face0)) is added to resu(num_face0) and, for real
 *    faces j, -0.5 * flux is added to resu(j);
 *  - implicit scheme: +/- valA (times the porosity of the column face) is added to the matrix
 *    entries coupling num_face0 and j; for a vectorial field the extra terms built from
 *    nu_turb / volume and the face normals are added as well.
 *
 * @param n_bord                  index of the boundary condition, which must be a Periodique
 * @param tab_inconnue            unknown; its line_size() gives the component count
 * @param tab_resu                residual, required (asserted non-null) for the explicit scheme
 * @param matrice_morse           matrix, required (asserted non-null) for the implicit scheme
 * @param tab_nu, tab_nu_turb     viscosities indexed by element
 * @param tab_porosite_eventuelle a view is always built on it, but it is read by the implicit branch only
 * @param tab_flux_bord           not used in this function
 */
template <typename DERIVED_T> template <Type_Champ _TYPE_, Type_Schema _SCHEMA_, bool _IS_STAB_, bool _IS_RANS_>


void Op_Dift_VEF_Face_Gen<DERIVED_T>::ajouter_bord_perio_gen__(const int n_bord, const DoubleTab& tab_inconnue, DoubleTab* tab_resu /* if explicit */, Matrice_Morse* matrice_morse /* if implicit */,

                                                               const DoubleTab& tab_nu, const DoubleTab& tab_nu_turb, const DoubleVect& tab_porosite_eventuelle, DoubleTab* tab_flux_bord) const

{

  constexpr bool is_VECT = (_TYPE_ == Type_Champ::VECTORIEL), is_EXPLICIT = (_SCHEMA_ == Type_Schema::EXPLICITE), is_STAB = _IS_STAB_, is_RANS = _IS_RANS_;


  const auto *z_class = static_cast<const DERIVED_T*>(this); // CRTP --> I love you :*


  const Domaine_Cl_VEF& domaine_Cl_VEF = z_class->domaine_cl_vef();

  const Domaine_VEF& domaine_VEF = z_class->domaine_vef();

  const Cond_lim& la_cl = domaine_Cl_VEF.les_conditions_limites(n_bord);

  const Front_VF& le_bord = ref_cast(Front_VF, la_cl->frontiere_dis());

  const Periodique& la_cl_perio = ref_cast(Periodique, la_cl.valeur());

  const int nb_faces_elem = domaine_VEF.domaine().nb_faces_elem(), nb_faces = domaine_VEF.nb_faces(), nb_comp = tab_inconnue.line_size();

  int num1 = 0, num2 = le_bord.nb_faces_tot(), nb_faces_bord_reel = le_bord.nb_faces();


  // deliberately iterate over only half the faces ... GF: do not process virtual faces
  // (this halving applies to the implicit scheme only; the explicit scheme keeps nb_faces_tot())

  num2 = is_EXPLICIT ? num2 : nb_faces_bord_reel / 2; // XXX: beware of discrepancies with multi-component version (num2 /= 2) ... also keeping explicit as num2


  CIntArrView le_bord_num_face = le_bord.num_face().view_ro();

  CIntArrView face_associee = la_cl_perio.face_associee().view_ro();

  CIntTabView elem_faces = domaine_VEF.elem_faces().view_ro();

  CIntTabView face_voisins = domaine_VEF.face_voisins().view_ro();

  CDoubleArrView volumes = domaine_VEF.volumes().view_ro();

  CDoubleArrView inverse_volumes = domaine_VEF.inverse_volumes().view_ro();

  CDoubleTabView face_normale = domaine_VEF.face_normales().view_ro();

  CDoubleArrView porosite_eventuelle = tab_porosite_eventuelle.view_ro();

  CDoubleTabView nu = tab_nu.view_ro();

  CDoubleTabView nu_turb = tab_nu_turb.view_ro();

  CDoubleTabView inconnue = tab_inconnue.view_ro();

  // Only one of the two outputs below is bound, depending on the scheme
  DoubleTabView resu;

  Matrice_Morse_View matrice;

  if (is_EXPLICIT)

    {

      assert(tab_resu != nullptr);

      // The explicit branch is only expected for a scalar, non-stabilised operator
      assert(!is_VECT && !_IS_STAB_);

      resu = tab_resu->view_rw();

    }

  else

    {

      assert(matrice_morse != nullptr);

      matrice.set(*matrice_morse);

    }

  Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__),

                       Kokkos::RangePolicy<>(num1, num2), KOKKOS_LAMBDA(

                         const int ind_face)

  {

    // ind_face is local to the boundary; both it and its associated face are mapped to global face numbers
    int fac_asso = face_associee(ind_face);

    fac_asso = le_bord_num_face(fac_asso);

    int num_face0 = le_bord_num_face(ind_face);


    // Loop over the two elements neighbouring the periodic face
    for (int l = 0; l < 2; l++)

      {

        int elem = face_voisins(num_face0, l);

        for (int i0 = 0; i0 < nb_faces_elem; i0++)

          {

            int j = elem_faces(elem, i0);


            if (is_EXPLICIT)

              {

                // Each pair (num_face0, j) is handled once (j > num_face0), skipping the associated periodic face
                if ((j > num_face0) && (j != fac_asso))

                  for (int nc = 0; nc < nb_comp; nc++)

                    {

                      const double d_nu = nu(elem, (is_RANS ? 0 : nc)) + nu_turb(elem, (is_RANS ? nc : 0));

                      const double valA = z_class->viscA(num_face0, j, elem, d_nu, face_voisins, face_normale, inverse_volumes);

                      const double flux = valA * inconnue(j, nc) - valA * inconnue(num_face0, nc);

                      // Atomic updates: the same residual entry can be reached from several work items
                      Kokkos::atomic_add(&resu(num_face0, nc), +flux);

                      if (j < nb_faces) // real face

                        Kokkos::atomic_add(&resu(j, nc), -0.5 * flux);

                    }

              }

            else   // implicit scheme

              {

                if (j > num_face0)

                  {

                    // orientation: sign of the vectorial extra terms
                    // ok: 1 when num_face0 is one of the faces of elem, 0 otherwise
                    // contrib: 0 for a virtual face j that has a missing (-1) neighbour
                    int orientation = 1, fac_loc = 0, ok = 1, contrib = 1;


                    if ((elem == face_voisins(j, l)) ||

                        (face_voisins(num_face0, (l + 1) % 2) == face_voisins(j, (l + 1) % 2)))

                      orientation = -1;


                    // Search num_face0 among the faces of elem
                    while ((fac_loc < nb_faces_elem) && (elem_faces(elem, fac_loc) != num_face0))

                      fac_loc++;


                    if (fac_loc == nb_faces_elem)

                      ok = 0;


                    if (j >= nb_faces) // virtual face

                      {

                        int el1 = face_voisins(j, 0), el2 = face_voisins(j, 1);

                        if ((el1 == -1) || (el2 == -1))

                          contrib = 0;

                      }


                    if (contrib)

                      for (int nc = 0; nc < nb_comp; nc++)

                        {

                          double d_nu = nu(elem, (is_VECT || is_RANS ) ? 0 : nc) + nu_turb(elem, (is_RANS ? nc : 0));

                          double valA = z_class->viscA(num_face0, j, elem, d_nu, face_voisins, face_normale, inverse_volumes);

                          // Stabilised operator: negative coefficients are clipped to zero
                          if (is_STAB && valA < 0.)

                            valA = 0.;


                          // Matrix indices: face number * nb_comp + component
                          int n0 = num_face0 * nb_comp + nc;

                          int n0perio = fac_asso * nb_comp + nc;

                          int j0 = j * nb_comp + nc;

                          matrice.atomic_add(n0, n0, + valA * porosite_eventuelle(num_face0));

                          matrice.atomic_add(n0, j0, - valA * porosite_eventuelle(j));


                          if (j < nb_faces) // Process real faces only

                            {

                              // When num_face0 is not a face of elem, row j0 is coupled to the associated periodic face instead
                              if (ok == 1)

                                matrice.atomic_add(j0, n0, - valA * porosite_eventuelle(num_face0));

                              else

                                matrice.atomic_add(j0, n0perio, - valA * porosite_eventuelle(num_face0));

                              matrice.atomic_add(j0, j0, + valA * porosite_eventuelle(j));

                            }


                          // XXX: this is the momentum equation (QDM), so the transposed grad_U contribution is added

                          if (is_VECT)

                            for (int nc2 = 0; nc2 < nb_comp; nc2++)

                              {

                                int n1 = num_face0 * nb_comp + nc2;

                                int j1 = j * nb_comp + nc2;

                                double coeff_s = orientation * nu_turb(elem,0) / volumes(elem) *

                                                 face_normale(num_face0, nc2) * face_normale(j, nc);

                                matrice.atomic_add(n0, n1, + coeff_s * porosite_eventuelle(num_face0));

                                matrice.atomic_add(n0, j1, - coeff_s * porosite_eventuelle(j));


                                if (j < nb_faces) // Process real faces only

                                  {

                                    // Same coefficient with the roles of nc and nc2 swapped
                                    double coeff_s2 = orientation * nu_turb(elem,0) / volumes(elem) *

                                                      face_normale(num_face0, nc) * face_normale(j, nc2);


                                    if (ok == 1)

                                      matrice.atomic_add(j0, n1, - coeff_s2 * porosite_eventuelle(num_face0));

                                    else

                                      matrice.atomic_add(j0, fac_asso * nb_comp + nc2, - coeff_s2 * porosite_eventuelle(num_face0));


                                    matrice.atomic_add(j0, j1, + coeff_s2 * porosite_eventuelle(j));

                                  }

                              }

                        }

                  }

              }

          }

      }

  });

  end_gpu_timer(__KERNEL_NAME__);

}


/*! @brief Wall-law correction of the diffusive flux of a scalar unknown on boundary n_bord.
 *
 *  The routine does nothing unless:
 *   - the TURBULENCE model of the equation is a Modele_turbulence_scal_base,
 *   - its wall law reports use_equivalent_distance(),
 *   - the boundary condition is a Scalaire_impose_paroi, or a Neumann_paroi / Neumann_homogene
 *     when the wall law flag get_flag_calcul_ldp_en_flux_impose() is set.
 *
 *  For each of the nb_faces_tot() faces of the boundary, the normal gradient rebuilt from the faces
 *  of the adjacent element ("mauvais gradient") is replaced by the one based on the equivalent
 *  distance ("bon gradient"):
 *   - explicit scheme: the correction is accumulated into tab_resu and, for the wall face itself,
 *     into tab_flux_bords;
 *   - implicit scheme: the matching coefficients are accumulated into matrice_morse.
 *
 *  @param n_bord index of the boundary condition to process
 *  @param tab_inconnue unknown, indexed (face, component)
 *  @param tab_resu residual; must be non-null for the explicit scheme
 *  @param matrice_morse matrix; must be non-null for the implicit scheme
 *  @param tab_nu molecular diffusivity, indexed (element, component)
 *  @param tab_nu_turb turbulent diffusivity, indexed (element, 0)
 *  @param tab_porosite_eventuelle porosity, indexed by face
 *  @param tab_flux_bords boundary fluxes; must be non-null for the explicit scheme
 */
template <typename DERIVED_T> template <Type_Champ _TYPE_, Type_Schema _SCHEMA_, bool _IS_STAB_>
void Op_Dift_VEF_Face_Gen<DERIVED_T>::ajouter_bord_scalaire_impose_gen__(const int n_bord, const DoubleTab& tab_inconnue, DoubleTab* tab_resu /* if explicit */, Matrice_Morse* matrice_morse /* if implicit */,
                                                                         const DoubleTab& tab_nu, const DoubleTab& tab_nu_turb, const DoubleVect& tab_porosite_eventuelle, DoubleTab* tab_flux_bords) const
{
  constexpr bool is_EXPLICIT = (_SCHEMA_ == Type_Schema::EXPLICITE);

  const auto *z_class = static_cast<const DERIVED_T*>(this); // CRTP: access to the concrete operator

  const Domaine_Cl_VEF& domaine_Cl_VEF = z_class->domaine_cl_vef();
  const RefObjU& modele_turbulence = domaine_Cl_VEF.equation().get_modele(TURBULENCE);
  if (!sub_type(Modele_turbulence_scal_base, modele_turbulence.valeur()))
    return;

  const Modele_turbulence_scal_base& mod_turb_scal = ref_cast(Modele_turbulence_scal_base, modele_turbulence.valeur());
  const Turbulence_paroi_scal_base& loiparth = mod_turb_scal.loi_paroi();
  if (!loiparth.use_equivalent_distance())
    return;

  // Wall laws only apply in cases where the BC is of imposed temperature type, since in the other cases
  // (imposed flux and adiabatic) the wall flux is known and fixed - unless the wall law explicitly asks for it.
  const Cond_lim_base& cl_base = domaine_Cl_VEF.les_conditions_limites(n_bord).valeur();
  bool ldp_appli = false;
  if (sub_type(Scalaire_impose_paroi, cl_base))
    ldp_appli = true;
  else if (loiparth.get_flag_calcul_ldp_en_flux_impose())
    ldp_appli = (sub_type(Neumann_paroi, cl_base)) || (sub_type(Neumann_homogene, cl_base));

  if (!ldp_appli)
    return;

  const Domaine_VEF& domaine_VEF = z_class->domaine_vef();
  const Front_VF& le_bord = ref_cast(Front_VF, domaine_Cl_VEF.les_conditions_limites(n_bord)->frontiere_dis());
  const int nb_faces_elem = domaine_VEF.domaine().nb_faces_elem();
  const int nb_comp = tab_inconnue.line_size();
  const int size_flux_bords = domaine_VEF.nb_faces_bord();
  const int num1 = 0;
  const int num2 = le_bord.nb_faces_tot();
  const int dim = Objet_U::dimension;

  // d_equiv contains the equivalent distance for the boundary
  // In d_equiv, for faces that are not paroi_fixe (eg periodic, symmetry, etc...)
  // the geometric distance is used thanks to the initialization of the array in the wall law.
  CDoubleArrView d_equiv = loiparth.equivalent_distance(n_bord).view_ro();
  CIntArrView le_bord_num_face = le_bord.num_face().view_ro();
  CIntTabView face_voisins = domaine_VEF.face_voisins().view_ro();
  CIntTabView elem_faces = domaine_VEF.elem_faces().view_ro();
  CDoubleTabView face_normale = domaine_VEF.face_normales().view_ro();
  CDoubleArrView volumes = domaine_VEF.volumes().view_ro();
  CDoubleArrView face_surfaces = domaine_VEF.face_surfaces().view_ro();
  CDoubleArrView porosite_eventuelle = tab_porosite_eventuelle.view_ro();
  CDoubleTabView nu = tab_nu.view_ro();
  CDoubleTabView nu_turb = tab_nu_turb.view_ro();
  CDoubleTabView inconnue = tab_inconnue.view_ro();
  DoubleTabView flux_bords;
  DoubleTabView resu;
  Matrice_Morse_View matrice;
  if (is_EXPLICIT)
    {
      assert(tab_resu != nullptr);
      assert(tab_flux_bords != nullptr); // dereferenced just below, same contract as tab_resu
      flux_bords = tab_flux_bords->view_rw();
      resu = tab_resu->view_rw();
    }
  else
    {
      assert(matrice_morse != nullptr);
      matrice.set(*matrice_morse);
    }

  Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__),
                       Kokkos::RangePolicy<>(num1, num2), KOKKOS_LAMBDA(
                         const int ind_face)
  {
    // Quantities that only depend on the boundary face, not on the component.
    const int num_face = le_bord_num_face(ind_face);
    int elem1 = face_voisins(num_face, 0);
    if (elem1 == -1) elem1 = face_voisins(num_face, 1);

    const double surface_face = face_surfaces(num_face);
    const double signe_num_face = oriente_normale(num_face, elem1, face_voisins);

    double le_mauvais_gradient[3] = { 0., 0., 0. };

    for (int nc = 0; nc < nb_comp; nc++)
      {
        const double nutotal = nu(elem1, nc) + nu_turb(elem1, 0);

        if (is_EXPLICIT)
          {
            // Tf is the mean fluid temperature in the first element without considering the wall temperature.
            double Tf = 0.;
            for (int kk = 0; kk < dim; kk++)
              le_mauvais_gradient[kk] = 0.;

            for (int i = 0; i < nb_faces_elem; i++)
              {
                const int j = elem_faces(elem1, i);
                const double signe_j = oriente_normale(j, elem1, face_voisins);
                if (j != num_face)
                  {
                    double surface_pond = 0.;
                    for (int kk = 0; kk < dim; kk++)
                      surface_pond -= (face_normale(j, kk) * signe_j *
                                       face_normale(num_face, kk) * signe_num_face) /
                                      (surface_face * surface_face);

                    Tf += inconnue(j, nc) * surface_pond;
                  }

                for (int kk = 0; kk < dim; kk++)
                  le_mauvais_gradient[kk] += inconnue(j, nc) * face_normale(j, kk) * signe_j;
              }

            for (int kk = 0; kk < dim; kk++)
              le_mauvais_gradient[kk] /= volumes(elem1);

            // Projection of the element gradient on the unit normal of the wall face.
            double mauvais_gradient = 0;
            for (int kk = 0; kk < dim; kk++)
              mauvais_gradient += le_mauvais_gradient[kk] * face_normale(num_face, kk) / surface_face;

            // inconnue(num_face) is the wall temperature: Tw.
            // The sign of bon_gradient does not matter since it is the norm of the temperature gradient in the element.
            // It will then be multiplied by the normal vector to the wall face which has the correct signs.
            const double bon_gradient = (Tf - inconnue(num_face, nc)) / d_equiv(ind_face) * (-signe_num_face);

            for (int i = 0; i < nb_faces_elem; i++)
              {
                const int j = elem_faces(elem1, i);
                const double signe_j = oriente_normale(j, elem1, face_voisins);
                double correction = 0.;
                for (int kk = 0; kk < dim; kk++)
                  correction += nutotal * (bon_gradient - mauvais_gradient) * face_normale(num_face, kk) *
                                face_normale(j, kk) * (-signe_j) / surface_face;

                Kokkos::atomic_add(&resu(j, nc), +correction);
                if (j == num_face && j < size_flux_bords)
                  Kokkos::atomic_add(&flux_bords(j, nc), -correction);
              }
          }
        else   // implicit
          {
            // Derivative of the wall-law gradient with respect to (Tf - Tw).
            const double bon_gradient = 1. / d_equiv(ind_face) * (-signe_num_face);

            for (int i0 = 0; i0 < nb_faces_elem; i0++)
              {
                const int j = elem_faces(elem1, i0);
                const double signe_j = oriente_normale(j, elem1, face_voisins);

                for (int ii = 0; ii < nb_faces_elem; ii++)
                  {
                    const int jj = elem_faces(elem1, ii);
                    const double signe_jj = oriente_normale(jj, elem1, face_voisins);

                    // Weight of face jj in Tf.
                    double surface_pond = 0;
                    for (int kk = 0; kk < dim; kk++)
                      surface_pond -= (face_normale(jj, kk) * signe_jj *
                                       face_normale(num_face, kk) * signe_num_face) /
                                      (surface_face * surface_face);

                    // Contribution of face jj alone to the element gradient.
                    for (int kk = 0; kk < dim; kk++)
                      le_mauvais_gradient[kk] = 0;
                    for (int kk = 0; kk < dim; kk++)
                      le_mauvais_gradient[kk] += face_normale(jj, kk) * signe_jj;
                    for (int kk = 0; kk < dim; kk++)
                      le_mauvais_gradient[kk] /= volumes(elem1);

                    double mauvais_gradient = 0;
                    for (int kk = 0; kk < dim; kk++)
                      mauvais_gradient +=
                        le_mauvais_gradient[kk] * face_normale(num_face, kk) / surface_face;

                    double resu1 = 0, resu2 = 0;
                    for (int kk = 0; kk < dim; kk++)
                      {
                        const double coeff = -nutotal * face_normale(num_face, kk) * face_normale(j, kk) * signe_j / surface_face;
                        resu1 += mauvais_gradient * coeff;
                        resu2 += bon_gradient * coeff;
                      }

                    // bon_gradient_reel = bon_gradient*(Tf-T_face) hence the derivatives... & mauvais_gradient_reel=mauvais_gradient_j*Tj
                    if (jj == num_face)
                      resu2 *= -1;
                    else
                      resu2 *= surface_pond;

                    const int j0 = j * nb_comp + nc, jj0 = jj * nb_comp + nc;
                    // Porosity is stored per face: index it with the face jj, not with the matrix column jj0
                    // (both coincide only when nb_comp == 1).
                    matrice.atomic_add(j0, jj0, (resu1 - resu2) * porosite_eventuelle(jj));
                  }
              }
          }
      }
  });
  end_gpu_timer(__KERNEL_NAME__);
}


/*! @brief Diffusion contribution of the faces of boundary n_bord.
 *
 *  Each boundary face (index 0 .. nb_faces_tot()-1 of the boundary) is paired with the other faces
 *  of its element face_voisins(face, 0). A pair is processed when the other face has a larger index,
 *  or unconditionally when the boundary face is beyond nb_faces() of the boundary (non-real face).
 *   - explicit scheme: fluxes valA * (difference of the unknown) are accumulated into tab_resu and
 *     tab_flux_bords;
 *   - implicit scheme: +/- valA * porosity coefficients are accumulated into matrice_morse; for a
 *     vector unknown the transposed-gradient coefficients are added as well.
 *
 *  @param n_bord index of the boundary condition to process
 *  @param tab_inconnue unknown, indexed (face, component)
 *  @param tab_resu residual; must be non-null for the explicit scheme
 *  @param matrice_morse matrix; must be non-null for the implicit scheme
 *  @param tab_nu molecular diffusivity, indexed by element
 *  @param tab_nu_turb turbulent diffusivity, indexed by element
 *  @param tab_porosite_eventuelle porosity, indexed by face
 *  @param tab_flux_bords boundary fluxes, used by the explicit scheme
 */
template <typename DERIVED_T> template <Type_Champ _TYPE_, Type_Schema _SCHEMA_, bool _IS_STAB_, bool _IS_RANS_>
void Op_Dift_VEF_Face_Gen<DERIVED_T>::ajouter_bord_gen__(const int n_bord, const DoubleTab& tab_inconnue, DoubleTab* tab_resu /* if explicit */, Matrice_Morse* matrice_morse /* if implicit */,
                                                         const DoubleTab& tab_nu, const DoubleTab& tab_nu_turb, const DoubleVect& tab_porosite_eventuelle, DoubleTab* tab_flux_bords) const
{
  constexpr bool is_VECT = (_TYPE_ == Type_Champ::VECTORIEL);
  constexpr bool is_EXPLICIT = (_SCHEMA_ == Type_Schema::EXPLICITE);
  constexpr bool is_STAB = _IS_STAB_;
  constexpr bool is_RANS = _IS_RANS_;

  const auto *z_class = static_cast<const DERIVED_T*>(this); // CRTP: access to the concrete operator

  const Domaine_Cl_VEF& domaine_Cl_VEF = z_class->domaine_cl_vef();
  const Domaine_VEF& domaine_VEF = z_class->domaine_vef();
  const Front_VF& le_bord = ref_cast(Front_VF, domaine_Cl_VEF.les_conditions_limites(n_bord)->frontiere_dis());

  const int nb_faces_elem = domaine_VEF.domaine().nb_faces_elem();
  const int nb_faces = domaine_VEF.nb_faces();
  const int nb_comp = tab_inconnue.line_size();
  const int premiere_face_int = domaine_VEF.premiere_face_int();
  const int num1 = 0;
  const int num2 = le_bord.nb_faces_tot();
  const int nb_faces_bord_reel = le_bord.nb_faces();

  CIntArrView le_bord_num_face = le_bord.num_face().view_ro();
  CIntTabView face_voisins = domaine_VEF.face_voisins().view_ro();
  CIntTabView elem_faces = domaine_VEF.elem_faces().view_ro();
  CDoubleTabView face_normale = domaine_VEF.face_normales().view_ro();
  CDoubleArrView volumes = domaine_VEF.volumes().view_ro();
  CDoubleArrView inverse_volumes = domaine_VEF.inverse_volumes().view_ro();
  CDoubleArrView porosite_eventuelle = tab_porosite_eventuelle.view_ro();
  CDoubleTabView nu = tab_nu.view_ro();
  CDoubleTabView nu_turb = tab_nu_turb.view_ro();
  CDoubleTabView inconnue = tab_inconnue.view_ro();
  DoubleTabView flux_bords;
  DoubleTabView resu;
  Matrice_Morse_View matrice;
  if (is_EXPLICIT)
    {
      assert(tab_resu != nullptr);
      assert(!is_VECT && !_IS_STAB_);
      flux_bords = tab_flux_bords->view_rw();
      resu = tab_resu->view_rw();
    }
  else
    {
      assert(matrice_morse != nullptr);
      matrice.set(*matrice_morse);
    }

  Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__),
                       Kokkos::RangePolicy<>(num1, num2), KOKKOS_LAMBDA(
                         const int ind_face)
  {
    const int face_b = le_bord_num_face(ind_face);
    const int elem = face_voisins(face_b, 0);
    // Only the first nb_faces() faces of the boundary receive contributions on their own row.
    const bool bord_reel = (ind_face < nb_faces_bord_reel);

    for (int i = 0; i < nb_faces_elem; i++)
      {
        const int face_j = elem_faces(elem, i);
        // For a real boundary face, each pair is visited once: only faces with a larger index are kept.
        if ((face_j <= face_b) && bord_reel)
          continue;

        const bool j_reelle = (face_j < nb_faces); // real face
        const int orientation = ((elem == face_voisins(face_j, 0)) || (face_voisins(face_b, 1) == face_voisins(face_j, 1))) ? -1 : 1;

        for (int nc = 0; nc < nb_comp; nc++)
          {
            const double d_nu = nu(elem, (is_VECT || is_RANS) ? 0 : nc) + nu_turb(elem, (is_RANS ? nc : 0));
            double valA = z_class->viscA(face_b, face_j, elem, d_nu, face_voisins, face_normale, inverse_volumes);

            if (is_STAB && valA < 0.) valA = 0.;

            if (is_EXPLICIT)
              {
                if (bord_reel)
                  {
                    const double flux_b = valA * (inconnue(face_j, nc) - inconnue(face_b, nc));
                    Kokkos::atomic_add(&resu(face_b, nc), +flux_b);
                    Kokkos::atomic_add(&flux_bords(face_b, nc), -flux_b);
                  }
                if (j_reelle)
                  {
                    const double flux_j = valA * (inconnue(face_b, nc) - inconnue(face_j, nc));
                    Kokkos::atomic_add(&resu(face_j, nc), +flux_j);
                    if (face_j < premiere_face_int)
                      Kokkos::atomic_add(&flux_bords(face_j, nc), -flux_j);
                  }
              }
            else // implicit
              {
                const int row_b = face_b * nb_comp + nc;
                const int row_j = face_j * nb_comp + nc;
                if (bord_reel)
                  {
                    matrice.atomic_add(row_b, row_b, + valA * porosite_eventuelle(face_b));
                    matrice.atomic_add(row_b, row_j, - valA * porosite_eventuelle(face_j));
                  }

                if (j_reelle)
                  {
                    matrice.atomic_add(row_j, row_b, - valA * porosite_eventuelle(face_b));
                    matrice.atomic_add(row_j, row_j, + valA * porosite_eventuelle(face_j));
                  }

                // XXX: this is the momentum equation (QDM), so the transposed grad_U term is added
                if (is_VECT)
                  {
                    const double prefacteur = orientation * nu_turb(elem, 0) / volumes(elem);
                    for (int nc2 = 0; nc2 < nb_comp; nc2++)
                      {
                        const int col_b = face_b * nb_comp + nc2;
                        const int col_j = face_j * nb_comp + nc2;
                        if (bord_reel)
                          {
                            const double coeff_b = prefacteur * face_normale(face_b, nc2) * face_normale(face_j, nc);
                            matrice.atomic_add(row_b, col_b, + coeff_b * porosite_eventuelle(face_b));
                            matrice.atomic_add(row_b, col_j, - coeff_b * porosite_eventuelle(face_j));
                          }

                        if (j_reelle)
                          {
                            const double coeff_j = prefacteur * face_normale(face_b, nc) * face_normale(face_j, nc2);
                            matrice.atomic_add(row_j, col_b, - coeff_j * porosite_eventuelle(face_b));
                            matrice.atomic_add(row_j, col_j, + coeff_j * porosite_eventuelle(face_j));
                          }
                      }
                  }
              }
          }
      }
  });
  end_gpu_timer(__KERNEL_NAME__);
}


/*! @brief Diffusion contribution of the internal faces.
 *
 *  The kernel runs over the faces [premiere_face_int, nb_faces) and over their two neighbouring
 *  elements. Inside each element the face is paired with every face of larger index; a pair is
 *  dropped when the other face is not a real face (index >= nb_faces) and lacks one neighbour.
 *   - explicit scheme: the flux valA * (u_j - u_face) is added to the face and subtracted from the
 *     other face when it is real;
 *   - implicit scheme: +/- valA * porosity coefficients are accumulated into matrice_morse; for a
 *     vector unknown the transposed-gradient coefficients are added too (zero when _IS_STAB_).
 *
 *  @param tab_inconnue unknown, indexed (face, component)
 *  @param tab_resu residual; must be non-null for the explicit scheme
 *  @param matrice_morse matrix; must be non-null for the implicit scheme
 *  @param tab_nu molecular diffusivity, indexed by element
 *  @param tab_nu_turb turbulent diffusivity, indexed by element
 *  @param tab_porosite_eventuelle porosity, indexed by face
 */
template <typename DERIVED_T> template <Type_Champ _TYPE_, Type_Schema _SCHEMA_, bool _IS_STAB_, bool _IS_RANS_>
void Op_Dift_VEF_Face_Gen<DERIVED_T>::ajouter_interne_gen__(const DoubleTab& tab_inconnue, DoubleTab* tab_resu /* if explicit */, Matrice_Morse* matrice_morse /* if implicit */,
                                                            const DoubleTab& tab_nu, const DoubleTab& tab_nu_turb, const DoubleVect& tab_porosite_eventuelle) const
{
  constexpr bool is_VECT = (_TYPE_ == Type_Champ::VECTORIEL);
  constexpr bool is_EXPLICIT = (_SCHEMA_ == Type_Schema::EXPLICITE);
  constexpr bool is_STAB = _IS_STAB_;
  constexpr bool is_RANS = _IS_RANS_;

  const auto *z_class = static_cast<const DERIVED_T*>(this); // CRTP: access to the concrete operator

  const Domaine_VEF& domaine_VEF = z_class->domaine_vef();
  const int premiere_face_int = domaine_VEF.premiere_face_int();
  const int nb_faces = domaine_VEF.nb_faces();
  const int nb_faces_elem = domaine_VEF.domaine().nb_faces_elem();
  const int nb_comp = tab_inconnue.line_size();

  CIntTabView face_voisins = domaine_VEF.face_voisins().view_ro();
  CIntTabView elem_faces = domaine_VEF.elem_faces().view_ro();
  CDoubleTabView face_normale = domaine_VEF.face_normales().view_ro();
  CDoubleArrView inverse_volumes = domaine_VEF.inverse_volumes().view_ro();
  CDoubleArrView porosite_eventuelle = tab_porosite_eventuelle.view_ro();
  CDoubleTabView nu = tab_nu.view_ro();
  CDoubleTabView nu_turb = tab_nu_turb.view_ro();
  CDoubleTabView inconnue = tab_inconnue.view_ro();
  DoubleTabView resu;
  Matrice_Morse_View matrice;
  if (is_EXPLICIT)
    {
      assert(tab_resu != nullptr);
      resu = tab_resu->view_rw();
    }
  else
    {
      assert(matrice_morse != nullptr);
      matrice.set(*matrice_morse);
    }

  // Second dimension of the range: the two neighbouring elements of each internal face.
  Kokkos::MDRangePolicy<Kokkos::Rank<2>> policy({premiere_face_int, 0}, {nb_faces, 2});
  Kokkos::parallel_for(start_gpu_timer(__KERNEL_NAME__), policy, KOKKOS_LAMBDA(const int face_i, const int side)
  {
    const int elem = face_voisins(face_i, side);
    for (int i0 = 0; i0 < nb_faces_elem; i0++)
      {
        const int face_j = elem_faces(elem, i0);
        // Each pair of faces is handled once, from the face of smaller index.
        if (face_j <= face_i)
          continue;

        const bool j_reelle = (face_j < nb_faces);
        // Virtual face with a missing neighbour: no contribution.
        if (!j_reelle && ((face_voisins(face_j, 0) == -1) || (face_voisins(face_j, 1) == -1)))
          continue;

        // XXX: this is the momentum equation (QDM), so the transposed grad_U term is added
        double transp = 0.;
        if (!is_EXPLICIT && is_VECT)
          {
            const bool inverse = (elem == face_voisins(face_j, side)) ||
                                 (face_voisins(face_i, 1 - side) == face_voisins(face_j, 1 - side));
            const int orientation = inverse ? -1 : 1;
            transp = orientation * nu_turb(elem, 0) * inverse_volumes(elem);
          }

        for (int nc = 0; nc < nb_comp; nc++)
          {
            const double d_nu = nu(elem, (is_VECT || is_RANS) ? 0 : nc) + nu_turb(elem, (is_RANS ? nc : 0));
            double valA = z_class->viscA(face_i, face_j, elem, d_nu, face_voisins, face_normale, inverse_volumes);

            if (is_STAB && valA < 0.) valA = 0.;

            if (is_EXPLICIT)
              {
                const double flux = valA * inconnue(face_j, nc) - valA * inconnue(face_i, nc);
                Kokkos::atomic_add(&resu(face_i, nc), flux);
                if (j_reelle) // real faces only
                  Kokkos::atomic_sub(&resu(face_j, nc), flux);
              }
            else // implicit scheme
              {
                const double poro_i = porosite_eventuelle(face_i);
                const double poro_j = porosite_eventuelle(face_j);
                const double diag_i = valA * poro_i;
                const double diag_j = valA * poro_j;
                const int row_i = face_i * nb_comp + nc;
                const int row_j = face_j * nb_comp + nc;

                matrice.atomic_add(row_i, row_i, diag_i);
                matrice.atomic_add(row_i, row_j, -diag_j);
                if (j_reelle) // real faces only
                  {
                    matrice.atomic_add(row_j, row_i, -diag_i);
                    matrice.atomic_add(row_j, row_j, diag_j);
                  }

                // XXX: this is the momentum equation (QDM), so the transposed grad_U term is added
                if (is_VECT)
                  {
                    const double normale_i_nc = face_normale(face_i, nc);
                    const double normale_j_nc = face_normale(face_j, nc);
                    for (int nc2 = 0; nc2 < nb_comp; nc2++)
                      {
                        const int col_i = face_i * nb_comp + nc2;
                        const int col_j = face_j * nb_comp + nc2;
                        const double coeff_s = is_STAB ? 0. : transp * face_normale(face_i, nc2) * normale_j_nc;

                        matrice.atomic_add(row_i, col_i, coeff_s * poro_i);
                        matrice.atomic_add(row_i, col_j, -coeff_s * poro_j);
                        if (j_reelle) // real faces only
                          {
                            const double coeff_s2 = is_STAB ? 0. : transp * normale_i_nc * face_normale(face_j, nc2);
                            matrice.atomic_add(row_j, col_i, -coeff_s2 * poro_i);
                            matrice.atomic_add(row_j, col_j, coeff_s2 * poro_j);
                          }
                      }
                  }
              }
          }
      }
  });
  end_gpu_timer(__KERNEL_NAME__);
}


#endif /* Op_Dift_VEF_Face_Gen_TPP_included */


Champ_P1NC::calcul_gradient
static DoubleTab & calcul_gradient(const DoubleTab &, DoubleTab &, const Domaine_Cl_VEF &)
Definition Champ_P1NC.cpp:912

Champ_P1NC::calcul_duidxj_paroi
static DoubleTab & calcul_duidxj_paroi(DoubleTab &, const DoubleTab &, const DoubleTab &, const DoubleTab &, const Domaine_Cl_VEF &)
Definition Champ_P1NC.cpp:920

Cond_lim_base
class Cond_lim_base Base class for the hierarchy of classes that represent the different boundary con...
Definition Cond_lim_base.h:40

Cond_lim
class Cond_lim Generic class used to represent any class
Definition Cond_lim.h:31

Conds_lim
class Conds_lim This class represents a vector of boundary conditions.
Definition Conds_lim.h:32

Domaine_32_64::creer_tableau_elements
virtual void creer_tableau_elements(Array_base &, RESIZE_OPTIONS opt=RESIZE_OPTIONS::COPY_INIT) const
Creates a parallel array of values at elements.
Definition Domaine.cpp:850

Domaine_32_64::nb_faces_elem
int nb_faces_elem(int=0) const
Returns the number of faces of type i of the geometric elements that make up the domain.
Definition Domaine.h:484

Domaine_Cl_VEF
Definition Domaine_Cl_VEF.h:38

Domaine_Cl_dis_base::les_conditions_limites
const Cond_lim & les_conditions_limites(int) const
Returns the i-th boundary condition.
Definition Domaine_Cl_dis_base.cpp:386

Domaine_VEF
class Domaine_VEF
Definition Domaine_VEF.h:53

Domaine_VF::face_surfaces
virtual const DoubleVect & face_surfaces() const
Definition Domaine_VF.h:51

Domaine_VF::nb_faces
int nb_faces() const
Returns the total number of faces.
Definition Domaine_VF.h:471

Domaine_VF::face_normales
virtual double face_normales(int face, int comp) const
Definition Domaine_VF.h:47

Domaine_VF::volumes
double volumes(int i) const
Definition Domaine_VF.h:113

Domaine_VF::elem_faces
int elem_faces(int i, int j) const
Returns the index of the i-th face of element num_elem; the face numbering convention is.
Definition Domaine_VF.h:542

Domaine_VF::premiere_face_int
int premiere_face_int() const
A face is internal if and only if it separates two elements.
Definition Domaine_VF.h:463

Domaine_VF::face_voisins
int face_voisins(int num_face, int i) const
Returns the neighbouring element of num_face in direction i.
Definition Domaine_VF.h:418

Domaine_VF::nb_faces_bord
int nb_faces_bord() const
Returns the number of faces on which boundary conditions are applied:
Definition Domaine_VF.h:512

Domaine_VF::inverse_volumes
double inverse_volumes(int i) const
Definition Domaine_VF.h:114

Domaine_dis_base::nb_elem
int nb_elem() const
Definition Domaine_dis_base.h:49

Domaine_dis_base::nb_front_Cl
int nb_front_Cl() const
Definition Domaine_dis_base.h:53

Domaine_dis_base::domaine
const Domaine & domaine() const
Definition Domaine_dis_base.h:46

Echange_externe_impose
Class Echange_externe_impose: This class represents the special case of the class.
Definition Echange_externe_impose.h:46

Echange_impose_base::tab_h_imp
const DoubleTab & tab_h_imp(double temps=DMAXFLOAT) const
Definition Echange_impose_base.cpp:284

Echange_impose_base::tab_T_ext
const DoubleTab & tab_T_ext(double temps=DMAXFLOAT) const
Definition Echange_impose_base.cpp:258

Equation_base::get_modele
virtual const RefObjU & get_modele(Type_modele type) const
Definition Equation_base.cpp:1894

Front_VF
class Front_VF
Definition Front_VF.h:36

Front_VF::nb_faces
int nb_faces() const
Definition Front_VF.h:53

Front_VF::num_premiere_face
int num_premiere_face() const
Definition Front_VF.h:63

Front_VF::nb_faces_tot
int nb_faces_tot() const
Definition Front_VF.h:58

Front_VF::num_face
int num_face(const int) const
Definition Front_VF.h:68

Matrice_Morse
Matrice_Morse class - Represents a (sparse) matrix M, not necessarily square,.
Definition Matrice_Morse.h:50

Modele_turbulence_scal_base
Base class for scalar turbulence models coupled to a Navier-Stokes convection-diffusion equation.
Definition Modele_turbulence_scal_base.h:38

Modele_turbulence_scal_base::loi_paroi
const Turbulence_paroi_scal_base & loi_paroi() const
Returns the scalar wall-law turbulence model (const version).
Definition Modele_turbulence_scal_base.h:88

MorEqn::equation
const Equation_base & equation() const
Returns the reference to the equation pointed to by MorEqn::mon_equation.
Definition MorEqn.h:62

Neumann_homogene
Class Neumann_homogene: This class is the base class of the hierarchy of homogeneous Neumann-type bou...
Definition Neumann_homogene.h:31

Neumann_paroi
Class Neumann_paroi: This boundary condition corresponds to an imposed flux for the.
Definition Neumann_paroi.h:29

Neumann_sortie_libre
Neumann_sortie_libre This class represents an open boundary without imposed velocity.
Definition Neumann_sortie_libre.h:34

Neumann::flux_impose
virtual double flux_impose(int i) const
Returns the value of the imposed flux on the i-th component of the field representing the flux at the...
Definition Neumann.cpp:35

Objet_U::dimension
static int dimension
Definition Objet_U.h:94

Op_Dift_VEF_Face_Gen::ajouter_bord_gen
std::enable_if_t< _TYPE_==Type_Champ::VECTORIEL, void > ajouter_bord_gen(const DoubleTab &, DoubleTab &, DoubleTab &, const DoubleTab &, const DoubleTab &) const
Definition Op_Dift_VEF_Face_Gen.tpp:106

Op_Dift_VEF_Face_Gen< Op_Diff_K_Eps_VEF_Face >::grad_
DoubleTab grad_
Definition Op_Dift_VEF_Face_Gen.h:65

Op_Dift_VEF_Face_Gen::modifie_pour_cl_gen
void modifie_pour_cl_gen(const DoubleTab &, DoubleTab &, DoubleTab &) const
Definition Op_Dift_VEF_Face_Gen.tpp:389

Op_Dift_VEF_Face_Gen::fill_grad_Re
void fill_grad_Re(const DoubleTab &, const DoubleTab &, const DoubleTab &, const DoubleTab &) const
Definition Op_Dift_VEF_Face_Gen.tpp:34

Op_Dift_VEF_Face_Gen::ajouter_contribution_bord_gen
void ajouter_contribution_bord_gen(const DoubleTab &, Matrice_Morse &, const DoubleTab &, const DoubleTab &, const DoubleVect &) const
Definition Op_Dift_VEF_Face_Gen.tpp:485

Op_Dift_VEF_Face_Gen< Op_Diff_K_Eps_VEF_Face >::Re_
DoubleTab Re_
Definition Op_Dift_VEF_Face_Gen.h:65

Op_Dift_VEF_Face_Gen::ajouter_interne_gen
std::enable_if_t< _TYPE_==Type_Champ::VECTORIEL, void > ajouter_interne_gen(const DoubleTab &, DoubleTab &, DoubleTab &, const DoubleTab &, const DoubleTab &) const
Definition Op_Dift_VEF_Face_Gen.tpp:307

Periodique
class Periodique This class represents a periodic boundary condition.
Definition Periodique.h:31

Periodique::face_associee
int face_associee(int i) const
Definition Periodique.h:35

Scalaire_impose_paroi
Scalaire_impose_paroi Imposes a scalar at the wall in a Convection-Diffusion equation for a scalar.
Definition Scalaire_impose_paroi.h:26

Symetrie
Symetrie On symmetry faces, the following properties hold:
Definition Symetrie.h:37

TRUSTTab::view_wo
std::enable_if_t< is_default_exec_space< EXEC_SPACE >, View< _TYPE_, _SHAPE_ > > view_wo()
Definition TRUSTTab.h:276

TRUSTTab::view_ro
std::enable_if_t< is_default_exec_space< EXEC_SPACE >, ConstView< _TYPE_, _SHAPE_ > > view_ro() const
Definition TRUSTTab.h:261

TRUSTTab::view_rw
std::enable_if_t< is_default_exec_space< EXEC_SPACE >, View< _TYPE_, _SHAPE_ > > view_rw()
Definition TRUSTTab.h:291

TRUSTVect::line_size
int line_size() const
Definition TRUSTVect.tpp:67

TRUST_Ref_Objet_U::valeur
const Objet_U & valeur() const
Definition TRUST_Ref.h:134

Turbulence_paroi_scal_base
Base class for the hierarchy of scalar wall-law models computing turbulent quantities near walls....
Definition Turbulence_paroi_scal_base.h:39

Turbulence_paroi_scal_base::use_equivalent_distance
virtual bool use_equivalent_distance() const
Gives a boolean indicating whether the equivalent distance must be used; by default we consider that we use the ...
Definition Turbulence_paroi_scal_base.cpp:177

Turbulence_paroi_scal_base::equivalent_distance
const DoubleVects & equivalent_distance() const
Definition Turbulence_paroi_scal_base.h:78

Turbulence_paroi_scal_base::get_flag_calcul_ldp_en_flux_impose
const int & get_flag_calcul_ldp_en_flux_impose() const
Definition Turbulence_paroi_scal_base.h:73

AjouterInterneData
Definition Op_Dift_VEF_Face_Gen.tpp:173

AjouterInterneData::grad
CDoubleTabView3 grad
Definition Op_Dift_VEF_Face_Gen.tpp:183

AjouterInterneData::nint
int nint
Definition Op_Dift_VEF_Face_Gen.tpp:175

AjouterInterneData::nb_faces
int nb_faces
Definition Op_Dift_VEF_Face_Gen.tpp:176

AjouterInterneData::nu
CDoubleArrView nu
Definition Op_Dift_VEF_Face_Gen.tpp:181

AjouterInterneData::resu
DoubleTabView resu
Definition Op_Dift_VEF_Face_Gen.tpp:186

AjouterInterneData::Re
CDoubleTabView3 Re
Definition Op_Dift_VEF_Face_Gen.tpp:182

AjouterInterneData::face_normale
CDoubleTabView face_normale
Definition Op_Dift_VEF_Face_Gen.tpp:180

AjouterInterneData::face_voisins
CIntTabView face_voisins
Definition Op_Dift_VEF_Face_Gen.tpp:179