From a70fd5adb34125922fec35da87dc51c5f56fc855 Mon Sep 17 00:00:00 2001 From: Sam Reeve <6740307+streeve@users.noreply.github.com> Date: Thu, 25 May 2023 23:28:21 -0400 Subject: [PATCH] Fuse boundary kernel --- .../finite_difference/finite_difference.cpp | 38 ++++++++++++------- 1 file changed, 25 insertions(+), 13 deletions(-) diff --git a/example/methods/finite_difference/finite_difference.cpp b/example/methods/finite_difference/finite_difference.cpp index 60ba98a0a..50dd53f32 100644 --- a/example/methods/finite_difference/finite_difference.cpp +++ b/example/methods/finite_difference/finite_difference.cpp @@ -18,32 +18,44 @@ #include +// Apply boundary conditions. For simplicity of the code, rebuild the index +// spaces each step even though it's a fixed geometry. Apply all boundaries in +// one kernel for performance. template void updateBoundaries( ExecutionSpace exec_space, LocalGridType local_grid, ArrayType& field ) { - // Update the boundary on each face of the cube. + // Create boundary indices for each plane. + Kokkos::Array, 6> boundary_spaces; + // Store the boundary details in device-accessible fixed-size arrays. + Kokkos::Array, 6> planes; + // Generate the boundary condition index spaces. + int count = 0; for ( int d = 0; d < 3; d++ ) { for ( int dir = -1; dir < 2; dir += 2 ) { - std::array plane = { 0, 0, 0 }; - plane[d] = dir; + planes[count] = { 0, 0, 0 }; + planes[count][d] = dir; // Get the boundary indices for this plane (each one is a separate, // contiguous index space). - auto boundary_space = local_grid->boundaryIndexSpace( - Cabana::Grid::Own(), Cabana::Grid::Cell(), plane ); - - Cabana::Grid::grid_parallel_for( - "boundary_update", exec_space, boundary_space, - KOKKOS_LAMBDA( const int i, const int j, const int k ) { - // Neumann boundary condition example - field( i, j, k, 0 ) = - field( i - plane[0], j - plane[1], k - plane[2], 0 ); - } ); + boundary_spaces[count] = local_grid->boundaryIndexSpace( + Cabana::Grid::Own(), Cabana::Grid::Cell(), planes[count][0], + planes[count][1], planes[count][2] ); + count++; } } + + // Update the boundary on each face of the cube. Pass the vector of index + // spaces to avoid launching 6 separate kernels. + Cajita::grid_parallel_for( + "boundary_update", exec_space, boundary_spaces, + KOKKOS_LAMBDA( const int b, const int i, const int j, const int k ) { + // Set boundary cells to the nearest internal value. + field( i, j, k, 0 ) = field( i - planes[b][0], j - planes[b][1], + k - planes[b][2], 0 ); + } ); } /*