Skip to content

Commit

Permalink
EBData: New class containing Array4's for all EB data (#4238)
Browse files Browse the repository at this point in the history
This can make the code cleaner because we can get access to all
available EB data in one object. This also reduces many GPU kernels'
register pressure because the GPU device lambdas are much smaller
without the need to capture multiple Array4's. For example, the 3D
EBABecLap's gsrb kernel's number of registers reduces from 198 to 130.

Add a new function that returns a random point on EB for WarpX.
  • Loading branch information
WeiqunZhang authored Dec 6, 2024
1 parent 6aa80df commit 96db0a6
Show file tree
Hide file tree
Showing 9 changed files with 355 additions and 99 deletions.
179 changes: 179 additions & 0 deletions Src/EB/AMReX_EBData.H
Original file line number Diff line number Diff line change
@@ -0,0 +1,179 @@
#ifndef AMREX_EB_DATA_H_
#define AMREX_EB_DATA_H_
#include <AMReX_Config.H>

#include <AMReX_EBCellFlag.H>
#include <AMReX_Random.H>

namespace amrex
{

enum struct EBData_t : int
{
levelset, // level set
volfrac, // volume fraction
centroid, // volume centroid
bndrycent, // boundary centroid
bndrynorm, // boundary normal
bndryarea, // boundary area
AMREX_D_DECL(apx, apy, apz), // area fraction
AMREX_D_DECL(fcx, fcy, fcz), // face centroid
AMREX_D_DECL(ecx, ecy, ecz), // edge centroid
cellflag // EBCellFlag
};

struct EBData
{
template <EBData_t T>
[[nodiscard]] AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
auto get (int i, int j, int k) const noexcept
{
if constexpr (T == EBData_t::cellflag) {
return (*m_cell_flag)(i,j,k);
} else {
return m_real_data[static_cast<int>(T)](i,j,k);
}
}

template <EBData_t T, std::enable_if_t< T == EBData_t::centroid
|| T == EBData_t::bndrycent
|| T == EBData_t::bndrynorm
AMREX_D_TERM(|| T==EBData_t::fcx,
|| T==EBData_t::fcy,
|| T==EBData_t::fcz), int> = 0>
[[nodiscard]] AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
auto get (int i, int j, int k, int n) const noexcept
{
return m_real_data[static_cast<int>(T)](i,j,k,n);
}

[[nodiscard]] AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
GpuArray<Real,AMREX_SPACEDIM>
randomPointOnEB (int i, int j, int k, RandomEngine const& engine) const
{
Real nx = this->get<EBData_t::bndrynorm>(i,j,k,0);
Real ny = this->get<EBData_t::bndrynorm>(i,j,k,1);
Real bcx = this->get<EBData_t::bndrycent>(i,j,k,0);
Real bcy = this->get<EBData_t::bndrycent>(i,j,k,1);
int dir = (std::abs(nx) >= std::abs(ny)) ? 0 : 1;
#if (AMREX_SPACEDIM == 2)
auto f = [&] (Real n0, Real n1, Real bc0, Real bc1)
{
Real rn = amrex::Random(engine);
if (n1 == 0) {
return amrex::makeTuple(bc0, rn-Real(0.5));
} else {
Real nn = n0/n1; // Note that we have n0 >= n1. So nn != 0.
Real ym = bc1+nn*(bc0-Real(-0.5)); // where x=-0.5 and EB intersects
Real yp = bc1+nn*(bc0-Real( 0.5)); // where x= 0.5 and EB intersects
Real ymin = std::min(ym,yp);
Real ymax = std::max(ym,yp);
ymin = std::max(ymin, Real(-0.5));
ymax = std::min(ymax, Real( 0.5));
Real y = rn/(ymax-ymin) + ymin;
Real x = bc0 - (y-bc1)*n1/n0;
return amrex::makeTuple(x,y);
}
};

if (dir == 0) {
auto [x,y] = f( nx, ny,
bcx,bcy);
return GpuArray<Real,2>{x,y};
} else {
auto [y,x] = f( ny, nx,
bcy,bcx);
return GpuArray<Real,2>{x,y};
}
#else
Real nz = this->get<EBData_t::bndrynorm>(i,j,k,2);
Real bcz = this->get<EBData_t::bndrycent>(i,j,k,2);
if (std::abs(nz) > std::abs(nx) && std::abs(nz) > std::abs(ny)) {
dir = 2;
}
auto f = [&] (Real n0, Real n1, Real n2, Real bc0, Real bc1, Real bc2)
{ // Note that n0 >= n1 >= n2;
if (n1 == 0 && n2 == 0) {
return amrex::makeTuple(bc0,
amrex::Random(engine)-Real(0.5),
amrex::Random(engine)-Real(0.5));
} else if (n2 == 0) {
Real nn = n0/n1;
Real ym = bc1+nn*(bc0-Real(-0.5));
Real yp = bc1+nn*(bc0-Real( 0.5));
Real ymin = std::min(ym,yp);
Real ymax = std::max(ym,yp);
ymin = std::max(ymin, Real(-0.5));
ymax = std::min(ymax, Real( 0.5));
Real y = amrex::Random(engine)/(ymax-ymin) + ymin;
Real z = amrex::Random(engine) - Real(0.5);
Real x = bc0 - ((y-bc1)*n1+(z-bc2)*n2)/n0;
return amrex::makeTuple(x,y,z);
} else {
Real y0 = bc1 - ((Real(-0.5)-bc0)*n0+(Real(-0.5)-bc2)*n2)/n1;
Real y1 = bc1 - ((Real( 0.5)-bc0)*n0+(Real(-0.5)-bc2)*n2)/n1;
Real y2 = bc1 - ((Real(-0.5)-bc0)*n0+(Real( 0.5)-bc2)*n2)/n1;
Real y3 = bc1 - ((Real( 0.5)-bc0)*n0+(Real( 0.5)-bc2)*n2)/n1;
Real ymin = std::min({y0,y1,y2,y3});
Real ymax = std::max({y0,y1,y2,y3});
ymin = std::max(ymin, Real(-0.5));
ymax = std::min(ymax, Real( 0.5));
Real z0 = bc2 - ((Real(-0.5)-bc0)*n0+(Real(-0.5)-bc1)*n1)/n2;
Real z1 = bc2 - ((Real( 0.5)-bc0)*n0+(Real(-0.5)-bc1)*n1)/n2;
Real z2 = bc2 - ((Real(-0.5)-bc0)*n0+(Real( 0.5)-bc1)*n1)/n2;
Real z3 = bc2 - ((Real( 0.5)-bc0)*n0+(Real( 0.5)-bc1)*n1)/n2;
Real zmin = std::min({z0,z1,z2,z3});
Real zmax = std::max({z0,z1,z2,z3});
zmin = std::max(zmin, Real(-0.5));
zmax = std::min(zmax, Real( 0.5));
Real x, y, z;
do {
y = amrex::Random(engine)/(ymax-ymin) + ymin;
z = amrex::Random(engine)/(zmax-zmin) + zmin;
x = bc0 - ((y-bc1)*n1+(z-bc2)*n2)/n0;
} while (x > Real(0.5) || x < Real(-0.5));
return amrex::makeTuple(x,y,z);
}
};
if (dir == 0) {
if (std::abs(ny) >= std::abs(nz)) {
auto [x,y,z] = f( nx, ny, nz,
bcx,bcy,bcz);
return GpuArray<Real,3>{x, y, z};
} else {
auto [x,z,y] = f( nx, nz, ny,
bcx,bcz,bcy);
return GpuArray<Real,3>{x, y, z};
}
} else if (dir == 1) {
if (std::abs(nx) >= std::abs(nz)) {
auto [y,x,z] = f( ny, nx, nz,
bcy,bcx,bcz);
return GpuArray<Real,3>{x, y, z};
} else {
auto [y,z,x] = f( ny, nz, nx,
bcy,bcz,bcx);
return GpuArray<Real,3>{x, y, z};
}
} else {
if (std::abs(nx) >= std::abs(ny)) {
auto [z,x,y] = f( nz, nx, ny,
bcz,bcx,bcy);
return GpuArray<Real,3>{x, y, z};
} else {
auto [z,y,x] = f( nz, ny, nx,
bcz,bcy,bcx);
return GpuArray<Real,3>{x, y, z};
}
}
#endif
}

static constexpr int real_data_size = static_cast<int>(EBData_t::cellflag);

Array4<EBCellFlag const> const* m_cell_flag = nullptr;
Array4<Real const> const* m_real_data = nullptr;
};

}
#endif
3 changes: 3 additions & 0 deletions Src/EB/AMReX_EBDataCollection.H
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,7 @@

namespace amrex {

class EBFArrayBoxFactory;
template <class T> class FabArray;
class MultiFab;
class iMultiFab;
Expand All @@ -19,6 +20,8 @@ class EBDataCollection
{
public:

friend class EBFArrayBoxFactory;

EBDataCollection (const EB2::Level& a_level, const Geometry& a_geom,
const BoxArray& a_ba, const DistributionMapping& a_dm,
Vector<int> a_ngrow, EBSupport a_support);
Expand Down
5 changes: 5 additions & 0 deletions Src/EB/AMReX_EBFabFactory.H
Original file line number Diff line number Diff line change
Expand Up @@ -4,10 +4,12 @@

#include <AMReX_FabFactory.H>

#include <AMReX_EBData.H>
#include <AMReX_EBDataCollection.H>
#include <AMReX_Geometry.H>
#include <AMReX_EBSupport.H>
#include <AMReX_Array.H>
#include <AMReX_MFIter.H>

namespace amrex
{
Expand Down Expand Up @@ -89,12 +91,15 @@ public:
//! One should use getMultiEBCellFlagFab for normal levels.
[[nodiscard]] iMultiFab const* getCutCellMask () const noexcept { return m_ebdc->getCutCellMask(); }

[[nodiscard]] EBData getEBData (MFIter const& mfi) const noexcept;

private:

EBSupport m_support;
Geometry m_geom;
std::shared_ptr<EBDataCollection> m_ebdc;
EB2::Level const* m_parent = nullptr;
Gpu::DeviceVector<Array4<Real const>> m_eb_data;
};

std::unique_ptr<EBFArrayBoxFactory>
Expand Down
78 changes: 77 additions & 1 deletion Src/EB/AMReX_EBFabFactory.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -20,7 +20,70 @@ EBFArrayBoxFactory::EBFArrayBoxFactory (const EB2::Level& a_level,
m_geom(a_geom),
m_ebdc(std::make_shared<EBDataCollection>(a_level,a_geom,a_ba,a_dm,a_ngrow,a_support)),
m_parent(&a_level)
{}
{
auto const& ebflags = getMultiEBCellFlagFab();
#ifdef AMREX_USE_GPU
m_eb_data.resize(EBData::real_data_size*ebflags.local_size());
Gpu::PinnedVector<Array4<Real const>> eb_data_hv;
#else
auto& eb_data_hv = m_eb_data;
#endif

eb_data_hv.reserve(EBData::real_data_size*ebflags.local_size());

for (MFIter mfi(ebflags,MFItInfo{}.DisableDeviceSync()); mfi.isValid(); ++mfi) {
Array4<Real const> a{};

bool cutfab_is_ok = ebflags[mfi].getType() == FabType::singlevalued;

a = ( m_ebdc->m_levelset )
? m_ebdc->m_levelset->const_array(mfi) : Array4<Real const>{};
eb_data_hv.push_back(a);

a = ( m_ebdc->m_volfrac )
? m_ebdc->m_volfrac->const_array(mfi) : Array4<Real const>{};
eb_data_hv.push_back(a);

a = ( m_ebdc->m_centroid && cutfab_is_ok )
? m_ebdc->m_centroid->const_array(mfi) : Array4<Real const>{};
eb_data_hv.push_back(a);

a = ( m_ebdc->m_bndrycent && cutfab_is_ok )
? m_ebdc->m_bndrycent->const_array(mfi) : Array4<Real const>{};
eb_data_hv.push_back(a);

a = ( m_ebdc->m_bndrynorm && cutfab_is_ok )
? m_ebdc->m_bndrynorm->const_array(mfi) : Array4<Real const>{};
eb_data_hv.push_back(a);

a = ( m_ebdc->m_bndryarea && cutfab_is_ok )
? m_ebdc->m_bndryarea->const_array(mfi) : Array4<Real const>{};
eb_data_hv.push_back(a);

for (int idim = 0; idim < AMREX_SPACEDIM; ++idim) {
a = ( m_ebdc->m_areafrac[idim] && cutfab_is_ok )
? m_ebdc->m_areafrac[idim]->const_array(mfi) : Array4<Real const>{};
eb_data_hv.push_back(a);
}

for (int idim = 0; idim < AMREX_SPACEDIM; ++idim) {
a = ( m_ebdc->m_facecent[idim] && cutfab_is_ok )
? m_ebdc->m_facecent[idim]->const_array(mfi) : Array4<Real const>{};
eb_data_hv.push_back(a);
}

for (int idim = 0; idim < AMREX_SPACEDIM; ++idim) {
a = ( m_ebdc->m_edgecent[idim] && cutfab_is_ok )
? m_ebdc->m_edgecent[idim]->const_array(mfi) : Array4<Real const>{};
eb_data_hv.push_back(a);
}
}

#ifdef AMREX_USE_GPU
Gpu::copyAsync(Gpu::hostToDevice, eb_data_hv.begin(), eb_data_hv.end(), m_eb_data.begin());
Gpu::streamSynchronize();
#endif
}

AMREX_NODISCARD
FArrayBox*
Expand Down Expand Up @@ -115,6 +178,19 @@ EBFArrayBoxFactory::hasEBInfo () const noexcept
return m_parent->hasEBInfo();
}

EBData
EBFArrayBoxFactory::getEBData (MFIter const& mfi) const noexcept
{
int const li = mfi.LocalIndex();
auto const& ebflags_ma = this->getMultiEBCellFlagFab().const_arrays();
#ifdef AMREX_USE_GPU
auto const* pebflag = ebflags_ma.dp + li;
#else
auto const* pebflag = ebflags_ma.hp + li;
#endif
return EBData{pebflag, m_eb_data.data()+EBData::real_data_size*li};
}

std::unique_ptr<EBFArrayBoxFactory>
makeEBFabFactory (const Geometry& a_geom,
const BoxArray& a_ba,
Expand Down
1 change: 1 addition & 0 deletions Src/EB/CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -20,6 +20,7 @@ foreach(D IN LISTS AMReX_SPACEDIM)
AMReX_EBMultiFabUtil.cpp
AMReX_EBCellFlag.H
AMReX_EBCellFlag.cpp
AMReX_EBData.H
AMReX_EBDataCollection.H
AMReX_EBDataCollection.cpp
AMReX_MultiCutFab.H
Expand Down
2 changes: 2 additions & 0 deletions Src/EB/Make.package
Original file line number Diff line number Diff line change
Expand Up @@ -12,6 +12,8 @@ CEXE_sources += AMReX_EBMultiFabUtil.cpp
CEXE_headers += AMReX_EBCellFlag.H
CEXE_sources += AMReX_EBCellFlag.cpp

CEXE_headers += AMReX_EBData.H

CEXE_headers += AMReX_EBDataCollection.H
CEXE_sources += AMReX_EBDataCollection.cpp

Expand Down
Loading

0 comments on commit 96db0a6

Please sign in to comment.