-
Notifications
You must be signed in to change notification settings - Fork 50
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Global particle redistribution based on the grid
- Loading branch information
Showing
5 changed files
with
559 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,327 @@ | ||
/**************************************************************************** | ||
* Copyright (c) 2018-2023 by the Cabana authors * | ||
* All rights reserved. * | ||
* * | ||
* This file is part of the Cabana library. Cabana is distributed under a * | ||
* BSD 3-clause license. For the licensing terms see the LICENSE file in * | ||
* the top-level directory. * | ||
* * | ||
* SPDX-License-Identifier: BSD-3-Clause * | ||
****************************************************************************/ | ||
|
||
/*! | ||
\file Cabana_Grid_GlobalParticleComm.hpp | ||
\brief Global particle communication. | ||
*/ | ||
#ifndef CABANA_GRID_GLOBALPARTICLECOMM_HPP | ||
#define CABANA_GRID_GLOBALPARTICLECOMM_HPP | ||
|
||
#include <Cabana_Grid_LocalMesh.hpp> | ||
#include <Cabana_Grid_Types.hpp> | ||
|
||
#include <Cabana_Distributor.hpp> | ||
#include <Cabana_Slice.hpp> | ||
|
||
#include <memory> | ||
#include <stdexcept> | ||
#include <type_traits> | ||
|
||
namespace Cabana | ||
{ | ||
namespace Grid | ||
{ | ||
//---------------------------------------------------------------------------// | ||
/*! | ||
\brief Global particle communication based on the background grid. | ||
*/ | ||
template <class MemorySpace, class LocalGridType> | ||
class GlobalParticleComm | ||
{ | ||
public: | ||
//! Spatial dimension. | ||
static constexpr std::size_t num_space_dim = LocalGridType::num_space_dim; | ||
//! Mesh type. | ||
using mesh_type = typename LocalGridType::mesh_type; | ||
//! Global grid. | ||
using global_grid_type = Cabana::Grid::GlobalGrid<mesh_type>; | ||
//! Kokkos memory space. | ||
using memory_space = MemorySpace; | ||
|
||
//! Local boundary View type. | ||
using corner_view_type = | ||
Kokkos::View<double* [num_space_dim][2], memory_space>; | ||
//! Particle destination ranks View type. | ||
using destination_view_type = Kokkos::View<int*, memory_space>; | ||
//! Cartesian rank View type. | ||
using rank_view_type = Kokkos::View<int***, memory_space>; | ||
//! Cartesian rank View type (host). | ||
using host_rank_view_type = Kokkos::View<int***, Kokkos::HostSpace>; | ||
|
||
//! \brief Constructor. | ||
GlobalParticleComm( const LocalGridType local_grid ) | ||
{ | ||
auto global_grid = local_grid.globalGrid(); | ||
_destinations = destination_view_type( | ||
Kokkos::ViewAllocateWithoutInitializing( "global_destination" ), | ||
0 ); | ||
|
||
int max_ranks_per_dim = -1; | ||
for ( std::size_t d = 0; d < num_space_dim; ++d ) | ||
{ | ||
_ranks_per_dim[d] = global_grid.dimNumBlock( d ); | ||
if ( _ranks_per_dim[d] > max_ranks_per_dim ) | ||
max_ranks_per_dim = _ranks_per_dim[d]; | ||
} | ||
copyRanks( global_grid ); | ||
|
||
// Purposely using zero-init. Some entries unused in non-cubic | ||
// decompositions. | ||
_local_corners = | ||
corner_view_type( "local_mpi_boundaries", max_ranks_per_dim ); | ||
|
||
_rank_1d = global_grid.blockId(); | ||
for ( std::size_t d = 0; d < num_space_dim; ++d ) | ||
_rank[d] = global_grid.dimBlockId( d ); | ||
|
||
auto local_mesh = createLocalMesh<memory_space>( local_grid ); | ||
storeRanks( local_mesh ); | ||
|
||
// Update local boundaries from all ranks. | ||
auto comm = global_grid.comm(); | ||
// TODO: Could use subcommunicators instead. | ||
MPI_Allreduce( MPI_IN_PLACE, _local_corners.data(), | ||
_local_corners.size(), MPI_DOUBLE, MPI_SUM, comm ); | ||
|
||
scaleRanks(); | ||
} | ||
|
||
//! Store local rank boundaries from the local mesh. | ||
template <class LocalMeshType> | ||
void storeRanks( LocalMeshType local_mesh ) | ||
{ | ||
auto store_corners = KOKKOS_CLASS_LAMBDA( const std::size_t d ) | ||
{ | ||
_local_corners( _rank[d], d, 0 ) = | ||
local_mesh.lowCorner( Cabana::Grid::Own(), d ); | ||
_local_corners( _rank[d], d, 1 ) = | ||
local_mesh.highCorner( Cabana::Grid::Own(), d ); | ||
}; | ||
using exec_space = typename memory_space::execution_space; | ||
Kokkos::RangePolicy<exec_space> policy( 0, num_space_dim ); | ||
Kokkos::parallel_for( "Cabana::Grid::GlobalParticleComm::storeCorners", | ||
policy, store_corners ); | ||
Kokkos::fence(); | ||
} | ||
|
||
//! Scale local rank boundaries based on double counting from MPI reduction. | ||
void scaleRanks() | ||
{ | ||
auto scale = getScaling(); | ||
|
||
auto scale_corners = KOKKOS_CLASS_LAMBDA( const std::size_t d ) | ||
{ | ||
for ( int r = 0; r < _ranks_per_dim[d]; ++r ) | ||
{ | ||
_local_corners( r, d, 0 ) /= scale[d]; | ||
_local_corners( r, d, 1 ) /= scale[d]; | ||
} | ||
}; | ||
using exec_space = typename memory_space::execution_space; | ||
Kokkos::RangePolicy<exec_space> policy( 0, num_space_dim ); | ||
Kokkos::parallel_for( "Cabana::Grid::GlobalParticleComm::scaleCorners", | ||
policy, scale_corners ); | ||
Kokkos::fence(); | ||
} | ||
|
||
template <std::size_t NSD = num_space_dim> | ||
std::enable_if_t<3 == NSD, Kokkos::Array<int, num_space_dim>> getScaling() | ||
{ | ||
Kokkos::Array<int, num_space_dim> scale; | ||
scale[0] = _ranks_per_dim[1] * _ranks_per_dim[2]; | ||
scale[1] = _ranks_per_dim[0] * _ranks_per_dim[2]; | ||
scale[2] = _ranks_per_dim[0] * _ranks_per_dim[1]; | ||
return scale; | ||
} | ||
|
||
template <std::size_t NSD = num_space_dim> | ||
std::enable_if_t<2 == NSD, Kokkos::Array<int, num_space_dim>> getScaling() | ||
{ | ||
Kokkos::Array<int, num_space_dim> scale; | ||
scale[0] = _ranks_per_dim[1]; | ||
scale[1] = _ranks_per_dim[0]; | ||
return scale; | ||
} | ||
|
||
//! Store all cartesian MPI ranks. | ||
template <class GlobalGridType, std::size_t NSD = num_space_dim> | ||
std::enable_if_t<3 == NSD, void> copyRanks( GlobalGridType global_grid ) | ||
{ | ||
host_rank_view_type global_ranks_host( | ||
Kokkos::ViewAllocateWithoutInitializing( "ranks_host" ), | ||
_ranks_per_dim[0], _ranks_per_dim[1], _ranks_per_dim[2] ); | ||
for ( int i = 0; i < _ranks_per_dim[0]; ++i ) | ||
for ( int j = 0; j < _ranks_per_dim[1]; ++j ) | ||
for ( int k = 0; k < _ranks_per_dim[2]; ++k ) | ||
// Not device accessible (uses MPI), so must be copied. | ||
global_ranks_host( i, j, k ) = | ||
global_grid.blockRank( i, j, k ); | ||
|
||
_global_ranks = Kokkos::create_mirror_view_and_copy( | ||
memory_space(), global_ranks_host ); | ||
} | ||
|
||
//! Store all cartesian MPI ranks. | ||
template <class GlobalGridType, std::size_t NSD = num_space_dim> | ||
std::enable_if_t<2 == NSD, void> copyRanks( GlobalGridType global_grid ) | ||
{ | ||
// Storing as 3d for convenience. | ||
host_rank_view_type global_ranks_host( | ||
Kokkos::ViewAllocateWithoutInitializing( "ranks_host" ), | ||
_ranks_per_dim[0], _ranks_per_dim[1], 1 ); | ||
for ( int i = 0; i < _ranks_per_dim[0]; ++i ) | ||
for ( int j = 0; j < _ranks_per_dim[1]; ++j ) | ||
// Not device accessible (uses MPI), so must be copied. | ||
global_ranks_host( i, j, 0 ) = global_grid.blockRank( i, j ); | ||
|
||
_global_ranks = Kokkos::create_mirror_view_and_copy( | ||
memory_space(), global_ranks_host ); | ||
} | ||
|
||
//! Get the MPI rank. | ||
template <std::size_t NSD = num_space_dim> | ||
KOKKOS_INLINE_FUNCTION std::enable_if_t<3 == NSD, int> | ||
getRank( int ijk[num_space_dim] ) const | ||
{ | ||
return _global_ranks( ijk[0], ijk[1], ijk[2] ); | ||
} | ||
|
||
//! Get the MPI rank. | ||
template <std::size_t NSD = num_space_dim> | ||
KOKKOS_INLINE_FUNCTION std::enable_if_t<2 == NSD, int> | ||
getRank( int ijk[num_space_dim] ) const | ||
{ | ||
return _global_ranks( ijk[0], ijk[1], 0 ); | ||
} | ||
|
||
/*! | ||
\brief Bin particles across the global grid. | ||
Because of MPI partitioning, this is not a perfect grid (as the Core | ||
LinkedCellList is), so we use binary search instead of direct 3d->1d | ||
indexing. | ||
*/ | ||
template <class ExecutionSpace, class PositionType> | ||
void build( ExecutionSpace exec_space, PositionType positions, | ||
const std::size_t begin, const std::size_t end ) | ||
{ | ||
Kokkos::Profiling::pushRegion( | ||
"Cabana::Grid::GlobalParticleComm::build" ); | ||
|
||
static_assert( is_accessible_from<memory_space, ExecutionSpace>{}, "" ); | ||
assert( end >= begin ); | ||
assert( end <= positions.size() ); | ||
|
||
// Must match the size of all particles, even if some can be ignored in | ||
// this search. | ||
Kokkos::resize( _destinations, positions.size() ); | ||
// Start with everything staying on this rank. | ||
Kokkos::deep_copy( _destinations, _rank_1d ); | ||
|
||
// Local copies for lambda capture. | ||
auto local_corners = _local_corners; | ||
auto ranks_per_dim = _ranks_per_dim; | ||
auto destinations = _destinations; | ||
auto build_migrate = KOKKOS_CLASS_LAMBDA( const std::size_t p ) | ||
{ | ||
int ijk[num_space_dim]; | ||
|
||
// Find the rank this particle should be moved to. | ||
for ( std::size_t d = 0; d < num_space_dim; ++d ) | ||
{ | ||
int min = 0; | ||
int max = ranks_per_dim[d]; | ||
|
||
// Check if outside the box in this dimension. | ||
if ( ( positions( p, d ) < local_corners( min, d, 0 ) ) || | ||
( positions( p, d ) > local_corners( max - 1, d, 1 ) ) ) | ||
destinations( p ) = -1; | ||
|
||
// Do a binary search for this particle in this dimension. | ||
while ( max - min > 1 ) | ||
{ | ||
int center = Kokkos::floor( ( max + min ) / 2.0 ); | ||
if ( positions( p, d ) < local_corners( center, d, 0 ) ) | ||
max = center; | ||
else | ||
min = center; | ||
} | ||
ijk[d] = min; | ||
} | ||
// Keep the destination rank for eventual migration. | ||
destinations( p ) = getRank( ijk ); | ||
}; | ||
|
||
Kokkos::RangePolicy<ExecutionSpace> policy( exec_space, begin, end ); | ||
Kokkos::parallel_for( "Cabana::Grid::GlobalParticleComm::build", policy, | ||
build_migrate ); | ||
Kokkos::fence(); | ||
|
||
Kokkos::Profiling::popRegion(); | ||
} | ||
|
||
//! Bin particles across the global grid. | ||
template <class ExecutionSpace, class PositionType> | ||
void build( ExecutionSpace exec_space, PositionType positions ) | ||
{ | ||
build( exec_space, positions, 0, positions.size() ); | ||
} | ||
|
||
//! Bin particles across the global grid. | ||
template <class PositionType> | ||
void build( PositionType positions ) | ||
{ | ||
using execution_space = typename memory_space::execution_space; | ||
// TODO: enable views. | ||
build( execution_space{}, positions, 0, positions.size() ); | ||
} | ||
|
||
//! Migrate particles to the correct rank. | ||
template <class AoSoAType> | ||
void migrate( MPI_Comm comm, AoSoAType& aosoa ) | ||
{ | ||
Cabana::Distributor<memory_space> distributor( comm, _destinations ); | ||
Cabana::migrate( distributor, aosoa ); | ||
} | ||
|
||
protected: | ||
//! Current rank. | ||
int _rank_1d; | ||
//! Current cartesian rank. | ||
Kokkos::Array<int, num_space_dim> _rank; | ||
//! Total ranks per dimension. | ||
Kokkos::Array<int, num_space_dim> _ranks_per_dim; | ||
//! Local boundaries. | ||
corner_view_type _local_corners; | ||
//! All cartesian ranks. | ||
rank_view_type _global_ranks; | ||
//! Particle destination ranks. | ||
destination_view_type _destinations; | ||
}; | ||
|
||
/*! | ||
\brief Create global linked cell binning. | ||
\return Shared pointer to a GlobalParticleComm. | ||
*/ | ||
template <class MemorySpace, class LocalGridType> | ||
auto createGlobalParticleComm( const LocalGridType& local_grid ) | ||
{ | ||
return std::make_shared<GlobalParticleComm<MemorySpace, LocalGridType>>( | ||
local_grid ); | ||
} | ||
|
||
//---------------------------------------------------------------------------// | ||
|
||
} // namespace Grid | ||
} // namespace Cabana | ||
|
||
#endif // end CABANA_GRID_GLOBALPARTICLECOMM_HPP |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -20,6 +20,7 @@ set(SERIAL_TESTS | |
|
||
set(MPI_TESTS | ||
GlobalGrid | ||
GlobalParticleComm | ||
LocalGrid | ||
IndexConversion | ||
LocalMesh3d | ||
|
Oops, something went wrong.