Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

dealii - remove duplicate GPU vec allocations #1652

Merged
merged 2 commits into from
Aug 30, 2024
Merged
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
84 changes: 61 additions & 23 deletions examples/deal.II/bps.h
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,8 @@
#include <deal.II/matrix_free/tools.h>

// libCEED includes
#include <ceed/ceed.h>
#include <ceed.h>
#include <ceed/backend.h>

// QFunction source
#include "bps-qfunctions.h"
Expand Down Expand Up @@ -160,6 +161,8 @@ class OperatorCeed : public OperatorBase<Number>
*/
~OperatorCeed()
{
// Release the two libCEED vectors held as members (src_ceed, dst_ceed);
// they are created with CeedElemRestrictionCreateVector() elsewhere in
// this class and are not tied to any single operator application.
CeedVectorDestroy(&src_ceed);
CeedVectorDestroy(&dst_ceed);
// Release the operator, and the Ceed context itself as the very last step.
// NOTE(review): presumably the context must outlive the objects created
// from it - keep this ordering unless libCEED documents otherwise.
CeedOperatorDestroy(&op_apply);
CeedDestroy(&ceed);
}
Expand Down Expand Up @@ -302,7 +305,11 @@ class OperatorCeed : public OperatorBase<Number>
CeedOperatorSetField(op_apply, "qdata", q_data_restriction, CEED_BASIS_NONE, q_data);
CeedOperatorSetField(op_apply, "v", sol_restriction, sol_basis, CEED_VECTOR_ACTIVE);

// 7) cleanup
// 7) libCEED vectors
CeedElemRestrictionCreateVector(sol_restriction, &src_ceed, NULL);
CeedElemRestrictionCreateVector(sol_restriction, &dst_ceed, NULL);

// 8) cleanup
CeedVectorDestroy(&q_data);
CeedElemRestrictionDestroy(&q_data_restriction);
CeedElemRestrictionDestroy(&sol_restriction);
Expand All @@ -322,30 +329,43 @@ class OperatorCeed : public OperatorBase<Number>

if (dof_handler.get_fe().n_components() == 1)
{
// create libCEED view on deal.II vectors
VectorTypeCeed src_ceed(ceed, src);
VectorTypeCeed dst_ceed(ceed, dst);
// pass memory buffers to libCEED
VectorTypeCeed x(src_ceed);
VectorTypeCeed y(dst_ceed);
x.set_array(src);
y.set_array(dst);

// apply operator
CeedOperatorApply(op_apply, src_ceed(), dst_ceed(), CEED_REQUEST_IMMEDIATE);
CeedOperatorApply(op_apply, x(), y(), CEED_REQUEST_IMMEDIATE);

// pull arrays back to deal.II
x.sync_to_host();
y.sync_to_host();
jeremylt marked this conversation as resolved.
Show resolved Hide resolved
}
else // TODO: needed for multiple components
{
// allocate space for block vectors
src_tmp.reinit(this->extended_local_size(), true);
dst_tmp.reinit(this->extended_local_size(), true);

copy_to_block_vector(src_tmp, src); // copy to block vector
// copy to block vector
copy_to_block_vector(src_tmp, src);

// create libCEED view on deal.II vectors
VectorTypeCeed src_ceed(ceed, src_tmp);
VectorTypeCeed dst_ceed(ceed, dst_tmp);
// pass memory buffers to libCEED
VectorTypeCeed x(src_ceed);
VectorTypeCeed y(dst_ceed);
x.set_array(src_tmp);
y.set_array(dst_tmp);

// apply operator
CeedOperatorApply(op_apply, src_ceed(), dst_ceed(), CEED_REQUEST_IMMEDIATE);
CeedOperatorApply(op_apply, x(), y(), CEED_REQUEST_IMMEDIATE);

dst_ceed.sync_to_host(); // pull libCEED data back to host
copy_from_block_vector(dst, dst_tmp); // copy from block vector
// pull arrays back to deal.II
x.sync_to_host();
y.sync_to_host();

// copy from block vector
copy_from_block_vector(dst, dst_tmp);
}

// communicate: compress
Expand Down Expand Up @@ -373,9 +393,14 @@ class OperatorCeed : public OperatorBase<Number>
{
this->initialize_dof_vector(diagonal);

VectorTypeCeed diagonal_ceed(ceed, diagonal);
// pass memory buffer to libCEED
VectorTypeCeed y(dst_ceed);
y.set_array(diagonal);

CeedOperatorLinearAssembleDiagonal(op_apply, y(), CEED_REQUEST_IMMEDIATE);

CeedOperatorLinearAssembleDiagonal(op_apply, diagonal_ceed(), CEED_REQUEST_IMMEDIATE);
// pull array back to deal.II
y.sync_to_host();

const unsigned int n_components = dof_handler.get_fe().n_components();

Expand Down Expand Up @@ -404,13 +429,10 @@ class OperatorCeed : public OperatorBase<Number>
/**
* Constructor.
*/
VectorTypeCeed(const Ceed &ceed, const VectorType &vec)
VectorTypeCeed(const CeedVector &vec_orig)
{
const unsigned int n_dofs =
vec.get_partitioner()->locally_owned_size() + vec.get_partitioner()->n_ghost_indices();

CeedVectorCreate(ceed, n_dofs, &vec_ceed);
CeedVectorSetArray(vec_ceed, CEED_MEM_HOST, CEED_USE_POINTER, vec.get_values());
vec_ceed = NULL;
CeedVectorReferenceCopy(vec_orig, &vec_ceed);
}

/**
Expand All @@ -422,6 +444,15 @@ class OperatorCeed : public OperatorBase<Number>
return vec_ceed;
}

/**
* Set deal.II memory in libCEED vector.
*/
void
set_array(const VectorType &vec)
{
CeedVectorSetArray(vec_ceed, CEED_MEM_HOST, CEED_USE_POINTER, vec.get_values());
}

/**
* Sync memory from device to host.
*/
Expand All @@ -436,8 +467,13 @@ class OperatorCeed : public OperatorBase<Number>
*/
~VectorTypeCeed()
{
  // A wrapper only needs to take an array back from libCEED if a host array
  // was actually lent to it (CeedVectorSetArray with CEED_USE_POINTER).
  // Taking it unconditionally defeats this check and fails for wrappers on
  // which no array was ever set, so the take happens solely under the guard.
  // The flag starts out false so that a failed query never triggers a take.
  bool has_array = false;
  CeedVectorHasBorrowedArrayOfType(vec_ceed, CEED_MEM_HOST, &has_array);

  if (has_array)
    {
      // The returned pointer is not needed here; the call is made only to
      // detach the borrowed array from the libCEED vector.
      CeedScalar *ptr = NULL;
      CeedVectorTakeArray(vec_ceed, CEED_MEM_HOST, &ptr);
    }

  // Release this wrapper's handle to the libCEED vector.
  CeedVectorDestroy(&vec_ceed);
}

Expand Down Expand Up @@ -705,6 +741,8 @@ class OperatorCeed : public OperatorBase<Number>
Ceed ceed;
std::vector<double> weights;
std::array<CeedInt, 3> strides;
CeedVector src_ceed;
CeedVector dst_ceed;
CeedOperator op_apply;

/**
Expand Down