From 7016e0bef12f3539a80766c2e714cbf74ec4d29d Mon Sep 17 00:00:00 2001 From: nbeams <246972+nbeams@users.noreply.github.com> Date: Mon, 4 Apr 2022 16:11:38 -0600 Subject: [PATCH 01/10] WIP multiprecision vectors: Change Vector read/write/set backend functions to generic version with precision parameter --- backends/cuda-ref/ceed-cuda-vector.c | 77 ++++--- backends/hip-ref/ceed-hip-ref-vector.c | 75 ++++--- backends/ref/ceed-ref-vector.c | 77 ++++--- include/ceed-impl.h | 20 +- include/ceed/backend.h | 19 +- interface/ceed-vector.c | 292 ++++++++++++++++++++----- interface/ceed.c | 14 +- 7 files changed, 398 insertions(+), 176 deletions(-) diff --git a/backends/cuda-ref/ceed-cuda-vector.c b/backends/cuda-ref/ceed-cuda-vector.c index bb373dd037..5ed7229ae1 100644 --- a/backends/cuda-ref/ceed-cuda-vector.c +++ b/backends/cuda-ref/ceed-cuda-vector.c @@ -88,8 +88,9 @@ static inline int CeedVectorSyncD2H_Cuda(const CeedVector vec) { //------------------------------------------------------------------------------ // Sync arrays //------------------------------------------------------------------------------ -static inline int CeedVectorSync_Cuda(const CeedVector vec, - CeedMemType mem_type) { +static inline int CeedVectorSyncGeneric_Cuda(const CeedVector vec, + CeedScalarType prec, + CeedMemType mem_type) { switch (mem_type) { case CEED_MEM_HOST: return CeedVectorSyncD2H_Cuda(vec); case CEED_MEM_DEVICE: return CeedVectorSyncH2D_Cuda(vec); @@ -150,7 +151,8 @@ static inline int CeedVectorHasArrayOfType_Cuda(const CeedVector vec, // Check if has borrowed array of given type //------------------------------------------------------------------------------ static inline int CeedVectorHasBorrowedArrayOfType_Cuda(const CeedVector vec, - CeedMemType mem_type, bool *has_borrowed_array_of_type) { + CeedMemType mem_type, CeedScalarType prec, + bool *has_borrowed_array_of_type) { int ierr; CeedVector_Cuda *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); @@ -194,7 +196,7 @@ static inline int CeedVectorNeedSync_Cuda(const CeedVector vec, // Set array from host //------------------------------------------------------------------------------ static int CeedVectorSetArrayHost_Cuda(const CeedVector vec, - const CeedCopyMode copy_mode, CeedScalar *array) { + const CeedCopyMode copy_mode, void *array) { int ierr; CeedVector_Cuda *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); @@ -236,7 +238,7 @@ static int CeedVectorSetArrayHost_Cuda(const CeedVector vec, // Set array from device //------------------------------------------------------------------------------ static int CeedVectorSetArrayDevice_Cuda(const CeedVector vec, - const CeedCopyMode copy_mode, CeedScalar *array) { + const CeedCopyMode copy_mode, void *array) { int ierr; Ceed ceed; ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); @@ -280,9 +282,11 @@ static int CeedVectorSetArrayDevice_Cuda(const CeedVector vec, // Set the array used by a vector, // freeing any previously allocated array if applicable //------------------------------------------------------------------------------ -static int CeedVectorSetArray_Cuda(const CeedVector vec, - const CeedMemType mem_type, - const CeedCopyMode copy_mode, CeedScalar *array) { +static int CeedVectorSetArrayGeneric_Cuda(const CeedVector vec, + const CeedMemType mem_type, + const CeedScalarType prec, + const CeedCopyMode copy_mode, + void *array) { int ierr; Ceed ceed; ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); @@ -359,8 +363,8 @@ static int CeedVectorSetValue_Cuda(CeedVector vec, CeedScalar val) { //------------------------------------------------------------------------------ // Vector Take Array //------------------------------------------------------------------------------ -static int CeedVectorTakeArray_Cuda(CeedVector vec, CeedMemType mem_type, - CeedScalar **array) { +static int CeedVectorTakeArrayGeneric_Cuda(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec, void **array) { int ierr; Ceed ceed; ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); @@ -396,7 +400,9 @@ static int CeedVectorTakeArray_Cuda(CeedVector vec, CeedMemType mem_type, // If a different memory type is most up to date, this will perform a copy //------------------------------------------------------------------------------ static int CeedVectorGetArrayCore_Cuda(const CeedVector vec, - const CeedMemType mem_type, CeedScalar **array) { + const CeedMemType mem_type, + const CeedScalarType prec, + void **array) { int ierr; Ceed ceed; ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); @@ -427,21 +433,26 @@ static int CeedVectorGetArrayCore_Cuda(const CeedVector vec, //------------------------------------------------------------------------------ // Get read-only access to a vector via the specified mem_type //------------------------------------------------------------------------------ -static int CeedVectorGetArrayRead_Cuda(const CeedVector vec, - const CeedMemType mem_type, const CeedScalar **array) { - return CeedVectorGetArrayCore_Cuda(vec, mem_type, (CeedScalar **)array); +static int CeedVectorGetArrayReadGeneric_Cuda(const CeedVector vec, + const CeedMemType mem_type, + const CeedScalarType prec, + const void **array) { + return CeedVectorGetArrayCore_Cuda(vec, mem_type, prec, (void **)array); } //------------------------------------------------------------------------------ -// Get read/write access to a vector via the specified mem_type +// Get read/write access to a vector via the specified mem_type and precision //------------------------------------------------------------------------------ static int CeedVectorGetArray_Cuda(const CeedVector vec, - const CeedMemType mem_type, CeedScalar **array) { + const CeedMemType mem_type, + const CeedScalarType prec, + void **array) { int ierr; CeedVector_Cuda *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - ierr = CeedVectorGetArrayCore_Cuda(vec, mem_type, array); CeedChkBackend(ierr); + ierr = CeedVectorGetArrayCore_Cuda(vec, mem_type, prec, array); + CeedChkBackend(ierr); ierr = CeedVectorSetAllInvalid_Cuda(vec); CeedChkBackend(ierr); switch (mem_type) { @@ -457,10 +468,12 @@ static int CeedVectorGetArray_Cuda(const CeedVector vec, } //------------------------------------------------------------------------------ -// Get write access to a vector via the specified mem_type +// Get write access to a vector via the specified mem_type and precision //------------------------------------------------------------------------------ -static int CeedVectorGetArrayWrite_Cuda(const CeedVector vec, - const CeedMemType mem_type, CeedScalar **array) { +static int CeedVectorGetArrayWriteGeneric_Cuda(const CeedVector vec, + const CeedMemType mem_type, + const CeedScalarType prec, + void **array) { int ierr; CeedVector_Cuda *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); @@ -470,7 +483,7 @@ static int CeedVectorGetArrayWrite_Cuda(const CeedVector vec, CeedChkBackend(ierr); if (!has_array_of_type) { // Allocate if array is not yet allocated - ierr = CeedVectorSetArray(vec, mem_type, CEED_COPY_VALUES, NULL); + ierr = CeedVectorSetArrayGeneric(vec, mem_type, prec, CEED_COPY_VALUES, NULL); CeedChkBackend(ierr); } else { // Select dirty array @@ -489,7 +502,7 @@ static int CeedVectorGetArrayWrite_Cuda(const CeedVector vec, } } - return CeedVectorGetArray_Cuda(vec, mem_type, array); + return CeedVectorGetArrayGeneric_Cuda(vec, mem_type, prec, array); } //------------------------------------------------------------------------------ @@ -756,19 +769,19 @@ int CeedVectorCreate_Cuda(CeedSize n, CeedVector vec) { ierr = CeedSetBackendFunction(ceed, "Vector", vec, "HasBorrowedArrayOfType", CeedVectorHasBorrowedArrayOfType_Cuda); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "SetArray", - CeedVectorSetArray_Cuda); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "TakeArray", - CeedVectorTakeArray_Cuda); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "SetArrayGeneric", + CeedVectorSetArrayGeneric_Cuda); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "TakeArrayGeneric", + CeedVectorTakeArrayGeneric_Cuda); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Vector", vec, "SetValue", (int (*)())(CeedVectorSetValue_Cuda)); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArray", - CeedVectorGetArray_Cuda); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayRead", - CeedVectorGetArrayRead_Cuda); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayWrite", - CeedVectorGetArrayWrite_Cuda); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayGeneric", + CeedVectorGetArrayGeneric_Cuda); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayReadGeneric", + CeedVectorGetArrayReadGeneric_Cuda); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayWriteGeneric", + CeedVectorGetArrayWriteGeneric_Cuda); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Vector", vec, "Norm", CeedVectorNorm_Cuda); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Vector", vec, "Reciprocal", diff --git a/backends/hip-ref/ceed-hip-ref-vector.c b/backends/hip-ref/ceed-hip-ref-vector.c index b8371225cb..a485c6ff2b 100644 --- a/backends/hip-ref/ceed-hip-ref-vector.c +++ b/backends/hip-ref/ceed-hip-ref-vector.c @@ -150,7 +150,8 @@ static inline int CeedVectorHasArrayOfType_Hip(const CeedVector vec, // Check if has borrowed array of given type //------------------------------------------------------------------------------ static inline int CeedVectorHasBorrowedArrayOfType_Hip(const CeedVector vec, - CeedMemType mem_type, bool *has_borrowed_array_of_type) { + CeedMemType mem_type, CeedScalarType prec, + bool *has_borrowed_array_of_type) { int ierr; CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); @@ -194,7 +195,7 @@ static inline int CeedVectorNeedSync_Hip(const CeedVector vec, // Set array from host //------------------------------------------------------------------------------ static int CeedVectorSetArrayHost_Hip(const CeedVector vec, - const CeedCopyMode copy_mode, CeedScalar *array) { + const CeedCopyMode copy_mode, void *array) { int ierr; CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); @@ -235,7 +236,7 @@ static int CeedVectorSetArrayHost_Hip(const CeedVector vec, // Set array from device //------------------------------------------------------------------------------ static int CeedVectorSetArrayDevice_Hip(const CeedVector vec, - const CeedCopyMode copy_mode, CeedScalar *array) { + const CeedCopyMode copy_mode, void *array) { int ierr; Ceed ceed; ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); @@ -279,9 +280,10 @@ static int CeedVectorSetArrayDevice_Hip(const CeedVector vec, // Set the array used by a vector, // freeing any previously allocated array if applicable //------------------------------------------------------------------------------ -static int CeedVectorSetArray_Hip(const CeedVector vec, - const CeedMemType mem_type, - const CeedCopyMode copy_mode, CeedScalar *array) { +static int CeedVectorSetArrayGeneric_Hip(const CeedVector vec, + const CeedMemType mem_type, + const CeedScalarType prec, + const CeedCopyMode copy_mode, void *array) { int ierr; Ceed ceed; ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); @@ -354,8 +356,9 @@ static int CeedVectorSetValue_Hip(CeedVector vec, CeedScalar val) { //------------------------------------------------------------------------------ // Vector Take Array //------------------------------------------------------------------------------ -static int CeedVectorTakeArray_Hip(CeedVector vec, CeedMemType mem_type, - CeedScalar **array) { +static int CeedVectorTakeArrayGeneric_Hip(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec, + void **array) { int ierr; Ceed ceed; ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); @@ -391,7 +394,9 @@ static int CeedVectorTakeArray_Hip(CeedVector vec, CeedMemType mem_type, // If a different memory type is most up to date, this will perform a copy //------------------------------------------------------------------------------ static int CeedVectorGetArrayCore_Hip(const CeedVector vec, - const CeedMemType mem_type, CeedScalar **array) { + const CeedMemType mem_type, + const CeedScalarType prec, + void **array) { int ierr; Ceed ceed; ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); @@ -420,24 +425,28 @@ static int CeedVectorGetArrayCore_Hip(const CeedVector vec, } //------------------------------------------------------------------------------ -// Get read-only access to a vector via the specified mem_type +// Get read-only access to a vector via the specified mem_type and precision //------------------------------------------------------------------------------ -static int CeedVectorGetArrayRead_Hip(const CeedVector vec, - const CeedMemType mem_type, const CeedScalar **array) { - return CeedVectorGetArrayCore_Hip(vec, mem_type, (CeedScalar **)array); +static int CeedVectorGetArrayReadGeneric_Hip(const CeedVector vec, + const CeedMemType mem_type, + const CeedScalarType prec, + const void **array) { + return CeedVectorGetArrayCore_Hip(vec, mem_type, prec, (void **)array); } //------------------------------------------------------------------------------ // Get read/write access to a vector via the specified mem_type //------------------------------------------------------------------------------ -static int CeedVectorGetArray_Hip(const CeedVector vec, - const CeedMemType mem_type, - CeedScalar **array) { +static int CeedVectorGetArrayGeneric_Hip(const CeedVector vec, + const CeedMemType mem_type, + const CeedScalarType prec, + void **array) { int ierr; CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - ierr = CeedVectorGetArrayCore_Hip(vec, mem_type, array); CeedChkBackend(ierr); + ierr = CeedVectorGetArrayCore_Hip(vec, mem_type, prec, array); + CeedChkBackend(ierr); ierr = CeedVectorSetAllInvalid_Hip(vec); CeedChkBackend(ierr); switch (mem_type) { @@ -453,10 +462,12 @@ static int CeedVectorGetArray_Hip(const CeedVector vec, } //------------------------------------------------------------------------------ -// Get write access to a vector via the specified mem_type +// Get write access to a vector via the specified mem_type and precision //------------------------------------------------------------------------------ -static int CeedVectorGetArrayWrite_Hip(const CeedVector vec, - const CeedMemType mem_type, CeedScalar **array) { +static int CeedVectorGetArrayWriteGeneric_Hip(const CeedVector vec, + const CeedMemType mem_type, + const CeedScalarType prec, + void **array) { int ierr; CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); @@ -466,7 +477,7 @@ static int CeedVectorGetArrayWrite_Hip(const CeedVector vec, CeedChkBackend(ierr); if (!has_array_of_type) { // Allocate if array is not yet allocated - ierr = CeedVectorSetArray(vec, mem_type, CEED_COPY_VALUES, NULL); + ierr = CeedVectorSetArrayGeneric(vec, mem_type, prec, CEED_COPY_VALUES, NULL); CeedChkBackend(ierr); } else { // Select dirty array @@ -485,7 +496,7 @@ static int CeedVectorGetArrayWrite_Hip(const CeedVector vec, } } - return CeedVectorGetArray_Hip(vec, mem_type, array); + return CeedVectorGetArrayGeneric_Hip(vec, mem_type, prec, array); } //------------------------------------------------------------------------------ @@ -752,18 +763,18 @@ int CeedVectorCreate_Hip(CeedSize n, CeedVector vec) { ierr = CeedSetBackendFunction(ceed, "Vector", vec, "HasBorrowedArrayOfType", CeedVectorHasBorrowedArrayOfType_Hip); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "SetArray", - CeedVectorSetArray_Hip); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "TakeArray", - CeedVectorTakeArray_Hip); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "SetArrayGeneric", + CeedVectorSetArrayGeneric_Hip); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "TakeArrayGeneric", + CeedVectorTakeArrayGeneric_Hip); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Vector", vec, "SetValue", (int (*)())(CeedVectorSetValue_Hip)); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArray", - CeedVectorGetArray_Hip); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayRead", - CeedVectorGetArrayRead_Hip); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayWrite", - CeedVectorGetArrayWrite_Hip); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayGeneric", + CeedVectorGetArrayGeneric_Hip); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayReadGeneric", + CeedVectorGetArrayReadGeneric_Hip); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayWriteGeneric", + CeedVectorGetArrayWriteGeneric_Hip); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Vector", vec, "Norm", CeedVectorNorm_Hip); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Vector", vec, "Reciprocal", diff --git a/backends/ref/ceed-ref-vector.c b/backends/ref/ceed-ref-vector.c index edb8209ae3..aea9507145 100644 --- a/backends/ref/ceed-ref-vector.c +++ b/backends/ref/ceed-ref-vector.c @@ -27,7 +27,7 @@ static int CeedVectorHasValidArray_Ref(CeedVector vec, bool *has_valid_array) { // Check if has borrowed array of given type //------------------------------------------------------------------------------ static inline int CeedVectorHasBorrowedArrayOfType_Ref(const CeedVector vec, - CeedMemType mem_type, bool *has_borrowed_array_of_type) { + CeedMemType mem_type, CeedScalarType prec, bool *has_borrowed_array_of_type) { int ierr; CeedVector_Ref *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); @@ -52,8 +52,9 @@ static inline int CeedVectorHasBorrowedArrayOfType_Ref(const CeedVector vec, //------------------------------------------------------------------------------ // Vector Set Array //------------------------------------------------------------------------------ -static int CeedVectorSetArray_Ref(CeedVector vec, CeedMemType mem_type, - CeedCopyMode copy_mode, CeedScalar *array) { +static int CeedVectorSetArrayGeneric_Ref(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec, + CeedCopyMode copy_mode, void *array) { int ierr; CeedVector_Ref *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); @@ -76,18 +77,18 @@ static int CeedVectorSetArray_Ref(CeedVector vec, CeedMemType mem_type, impl->array_borrowed = NULL; impl->array = impl->array_owned; if (array) - memcpy(impl->array, array, length * sizeof(array[0])); + memcpy(impl->array, array, length * sizeof(CeedScalar)); break; case CEED_OWN_POINTER: ierr = CeedFree(&impl->array_owned); CeedChkBackend(ierr); - impl->array_owned = array; + impl->array_owned = (CeedScalar *) array; impl->array_borrowed = NULL; - impl->array = array; + impl->array = (CeedScalar *) array; break; case CEED_USE_POINTER: ierr = CeedFree(&impl->array_owned); CeedChkBackend(ierr); - impl->array_borrowed = array; - impl->array = array; + impl->array_borrowed = (CeedScalar *) array; + impl->array = (CeedScalar *) array; } return CEED_ERROR_SUCCESS; } @@ -95,8 +96,8 @@ static int CeedVectorSetArray_Ref(CeedVector vec, CeedMemType mem_type, //------------------------------------------------------------------------------ // Vector Take Array //------------------------------------------------------------------------------ -static int CeedVectorTakeArray_Ref(CeedVector vec, CeedMemType mem_type, - CeedScalar **array) { +static int CeedVectorTakeArrayGeneric_Ref(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec, void **array) { int ierr; CeedVector_Ref *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); @@ -114,7 +115,7 @@ static int CeedVectorTakeArray_Ref(CeedVector vec, CeedMemType mem_type, // Vector Get Array //------------------------------------------------------------------------------ static int CeedVectorGetArrayCore_Ref(CeedVector vec, CeedMemType mem_type, - CeedScalar **array) { + CeedScalarType prec, void **array) { int ierr; CeedVector_Ref *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); @@ -135,24 +136,28 @@ static int CeedVectorGetArrayCore_Ref(CeedVector vec, CeedMemType mem_type, //------------------------------------------------------------------------------ // Vector Get Array Read //------------------------------------------------------------------------------ -static int CeedVectorGetArrayRead_Ref(CeedVector vec, CeedMemType mem_type, - const CeedScalar **array) { - return CeedVectorGetArrayCore_Ref(vec, mem_type, (CeedScalar **)array); +static int CeedVectorGetArrayReadGeneric_Ref(CeedVector vec, + CeedMemType mem_type, + CeedScalarType prec, + const void **array) { + return CeedVectorGetArrayCore_Ref(vec, mem_type, prec, (void **)array); } //------------------------------------------------------------------------------ // Vector Get Array //------------------------------------------------------------------------------ -static int CeedVectorGetArray_Ref(CeedVector vec, CeedMemType mem_type, - CeedScalar **array) { - return CeedVectorGetArrayCore_Ref(vec, mem_type, array); +static int CeedVectorGetArrayGeneric_Ref(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec, void **array) { + return CeedVectorGetArrayCore_Ref(vec, mem_type, prec, array); } //------------------------------------------------------------------------------ // Vector Get Array Write //------------------------------------------------------------------------------ -static int CeedVectorGetArrayWrite_Ref(CeedVector vec, CeedMemType mem_type, - const CeedScalar **array) { +static int CeedVectorGetArrayWriteGeneric_Ref(CeedVector vec, + CeedMemType mem_type, + CeedScalarType prec, + const void **array) { int ierr; CeedVector_Ref *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); @@ -171,17 +176,17 @@ static int CeedVectorGetArrayWrite_Ref(CeedVector vec, CeedMemType mem_type, } } - return CeedVectorGetArrayCore_Ref(vec, mem_type, (CeedScalar **)array); + return CeedVectorGetArrayCore_Ref(vec, mem_type, prec, (void **) array); } //------------------------------------------------------------------------------ // Vector Restore Array //------------------------------------------------------------------------------ -static int CeedVectorRestoreArray_Ref(CeedVector vec) { +static int CeedVectorRestoreArrayGeneric_Ref(CeedVector vec) { return CEED_ERROR_SUCCESS; } -static int CeedVectorRestoreArrayRead_Ref(CeedVector vec) { +static int CeedVectorRestoreArrayReadGeneric_Ref(CeedVector vec) { return CEED_ERROR_SUCCESS; } @@ -212,20 +217,20 @@ int CeedVectorCreate_Ref(CeedSize n, CeedVector vec) { ierr = CeedSetBackendFunction(ceed, "Vector", vec, "HasBorrowedArrayOfType", CeedVectorHasBorrowedArrayOfType_Ref); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "SetArray", - CeedVectorSetArray_Ref); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "TakeArray", - CeedVectorTakeArray_Ref); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArray", - CeedVectorGetArray_Ref); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayRead", - CeedVectorGetArrayRead_Ref); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayWrite", - CeedVectorGetArrayWrite_Ref); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "RestoreArray", - CeedVectorRestoreArray_Ref); CeedChkBackend(ierr); - ierr = CeedSetBackendFunction(ceed, "Vector", vec, "RestoreArrayRead", - CeedVectorRestoreArrayRead_Ref); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "SetArrayGeneric", + CeedVectorSetArrayGeneric_Ref); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "TakeArrayGeneric", + CeedVectorTakeArrayGeneric_Ref); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayGeneric", + CeedVectorGetArrayGeneric_Ref); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayReadGeneric", + CeedVectorGetArrayReadGeneric_Ref); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayWriteGeneric", + CeedVectorGetArrayWriteGeneric_Ref); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "RestoreArrayGeneric", + CeedVectorRestoreArrayGeneric_Ref); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "RestoreArrayReadGeneric", + CeedVectorRestoreArrayReadGeneric_Ref); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Vector", vec, "Destroy", CeedVectorDestroy_Ref); CeedChkBackend(ierr); diff --git a/include/ceed-impl.h b/include/ceed-impl.h index a1985e81b8..be1445adde 100644 --- a/include/ceed-impl.h +++ b/include/ceed-impl.h @@ -128,16 +128,18 @@ struct Ceed_private { struct CeedVector_private { Ceed ceed; int (*HasValidArray)(CeedVector, bool *); - int (*HasBorrowedArrayOfType)(CeedVector, CeedMemType, bool *); - int (*SetArray)(CeedVector, CeedMemType, CeedCopyMode, CeedScalar *); + int (*HasBorrowedArrayOfType)(CeedVector, CeedMemType, CeedScalarType, bool *); + int (*SetArrayGeneric)(CeedVector, CeedMemType, CeedScalarType, CeedCopyMode, + void *); int (*SetValue)(CeedVector, CeedScalar); - int (*SyncArray)(CeedVector, CeedMemType); - int (*TakeArray)(CeedVector, CeedMemType, CeedScalar **); - int (*GetArray)(CeedVector, CeedMemType, CeedScalar **); - int (*GetArrayRead)(CeedVector, CeedMemType, const CeedScalar **); - int (*GetArrayWrite)(CeedVector, CeedMemType, CeedScalar **); - int (*RestoreArray)(CeedVector); - int (*RestoreArrayRead)(CeedVector); + int (*SyncArrayGeneric)(CeedVector, CeedMemType, CeedScalarType); + int (*TakeArrayGeneric)(CeedVector, CeedMemType, CeedScalarType, void **); + int (*GetArrayGeneric)(CeedVector, CeedMemType, CeedScalarType, void **); + int (*GetArrayReadGeneric)(CeedVector, CeedMemType, CeedScalarType, + const void **); + int (*GetArrayWriteGeneric)(CeedVector, CeedMemType, CeedScalarType, void **); + int (*RestoreArrayGeneric)(CeedVector); + int (*RestoreArrayReadGeneric)(CeedVector); int (*Norm)(CeedVector, CeedNormType, CeedScalar *); int (*Scale)(CeedVector, CeedScalar); int (*AXPY)(CeedVector, CeedScalar, CeedVector); diff --git a/include/ceed/backend.h b/include/ceed/backend.h index 6156a1f881..aae6b1fcea 100644 --- a/include/ceed/backend.h +++ b/include/ceed/backend.h @@ -132,13 +132,28 @@ CEED_EXTERN int CeedReference(Ceed ceed); CEED_EXTERN int CeedVectorHasValidArray(CeedVector vec, bool *has_valid_array); CEED_EXTERN int CeedVectorHasBorrowedArrayOfType(CeedVector vec, CeedMemType mem_type, - bool *has_borrowed_array_of_type); -CEED_EXTERN int CeedVectorHasValidArray(CeedVector vec, bool *has_valid_array); + CeedScalarType prec, bool *has_borrowed_array_of_type); CEED_EXTERN int CeedVectorGetState(CeedVector vec, uint64_t *state); CEED_EXTERN int CeedVectorAddReference(CeedVector vec); CEED_EXTERN int CeedVectorGetData(CeedVector vec, void *data); CEED_EXTERN int CeedVectorSetData(CeedVector vec, void *data); CEED_EXTERN int CeedVectorReference(CeedVector vec); +CEED_EXTERN int CeedVectorSetArrayGeneric(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec, CeedCopyMode copy_mode, + void *array); +CEED_EXTERN int CeedVectorSyncArrayGeneric(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec); +CEED_EXTERN int CeedVectorTakeArrayGeneric(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec, void **array); +CEED_EXTERN int CeedVectorGetArrayGeneric(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec, void **array); +CEED_EXTERN int CeedVectorGetArrayReadGeneric(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec, const void **array); +CEED_EXTERN int CeedVectorGetArrayWriteGeneric(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec, void **array); +CEED_EXTERN int CeedVectorRestoreArrayGeneric(CeedVector vec, void **array); +CEED_EXTERN int CeedVectorRestoreArrayReadGeneric(CeedVector vec, + const void **array); CEED_EXTERN int CeedElemRestrictionGetStrides(CeedElemRestriction rstr, CeedInt (*strides)[3]); diff --git a/interface/ceed-vector.c b/interface/ceed-vector.c index eb40a4ba46..8151c54ec0 100644 --- a/interface/ceed-vector.c +++ b/interface/ceed-vector.c @@ -75,7 +75,7 @@ int CeedVectorHasValidArray(CeedVector vec, bool *has_valid_array) { @ref Backend **/ int CeedVectorHasBorrowedArrayOfType(CeedVector vec, CeedMemType mem_type, - bool *has_borrowed_array_of_type) { + CeedScalarType prec, bool *has_borrowed_array_of_type) { int ierr; if (!vec->HasBorrowedArrayOfType) @@ -84,7 +84,8 @@ int CeedVectorHasBorrowedArrayOfType(CeedVector vec, CeedMemType mem_type, "Backend does not support HasBorrowedArrayOfType"); // LCOV_EXCL_STOP - ierr = vec->HasBorrowedArrayOfType(vec, mem_type, has_borrowed_array_of_type); + ierr = vec->HasBorrowedArrayOfType(vec, mem_type, prec, + has_borrowed_array_of_type); CeedChk(ierr); return CEED_ERROR_SUCCESS; @@ -237,25 +238,27 @@ int CeedVectorReferenceCopy(CeedVector vec, CeedVector *vec_copy) { /** @brief Set the array used by a CeedVector, freeing any previously allocated array if applicable. The backend may copy values to a different - memtype, such as during @ref CeedOperatorApply(). + memtype and/or precision, such as during @ref CeedOperatorApply(). See also @ref CeedVectorSyncArray() and @ref CeedVectorTakeArray(). @param vec CeedVector @param mem_type Memory type of the array being passed + @param prec Scalar precision type of array being passed @param copy_mode Copy mode for the array @param array Array to be used, or NULL with @ref CEED_COPY_VALUES to have the library allocate + Intended for internal/backend use. @return An error code: 0 - success, otherwise - failure - @ref User + @ref Backend **/ -int CeedVectorSetArray(CeedVector vec, CeedMemType mem_type, - CeedCopyMode copy_mode, - CeedScalar *array) { +int CeedVectorSetArrayGeneric(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec, CeedCopyMode copy_mode, + void *array) { int ierr; - if (!vec->SetArray) + if (!vec->SetArrayGeneric) // LCOV_EXCL_START return CeedError(vec->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support VectorSetArray"); @@ -271,11 +274,35 @@ int CeedVectorSetArray(CeedVector vec, CeedMemType mem_type, "Cannot grant CeedVector array access, a " "process has read access"); - ierr = vec->SetArray(vec, mem_type, copy_mode, array); CeedChk(ierr); + ierr = vec->SetArrayGeneric(vec, mem_type, prec, copy_mode, array); + CeedChk(ierr); vec->state += 2; return CEED_ERROR_SUCCESS; } +/** + @brief Set the array used by a CeedVector, freeing any previously allocated + array if applicable. The backend may copy values to a different + memtype, such as during @ref CeedOperatorApply(). + See also @ref CeedVectorSyncArray() and @ref CeedVectorTakeArray(). + + @param vec CeedVector + @param mem_type Memory type of the array being passed + @param copy_mode Copy mode for the array + @param array Array to be used, or NULL with @ref CEED_COPY_VALUES to have the + library allocate + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorSetArray(CeedVector vec, CeedMemType mem_type, + CeedCopyMode copy_mode, + CeedScalar *array) { + return CeedVectorSetArrayGeneric(vec, mem_type, CEED_SCALAR_TYPE, copy_mode, + (void **) array); +} + /** @brief Set the CeedVector to a constant value @@ -316,19 +343,21 @@ int CeedVectorSetValue(CeedVector vec, CeedScalar value) { } /** - @brief Sync the CeedVector to a specified memtype. This function is used to - force synchronization of arrays set with @ref CeedVectorSetArray(). - If the requested memtype is already synchronized, this function - results in a no-op. + @brief Sync the CeedVector to a specified memtype and precision. This function + is used to force synchronization of arrays set with @ref CeedVectorSetArray(). + If the requested memtype/precision is already synchronized, this function + results in a no-op. Intended for internal/backend use. @param vec CeedVector @param mem_type Memtype to be synced + @param prec Scalar precision to be synced @return An error code: 0 - success, otherwise - failure - @ref User + @ref Backend **/ -int CeedVectorSyncArray(CeedVector vec, CeedMemType mem_type) { +int CeedVectorSyncArrayGeneric(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec) { int ierr; if (vec->state % 2 == 1) @@ -336,35 +365,55 @@ int CeedVectorSyncArray(CeedVector vec, CeedMemType mem_type) { "Cannot sync CeedVector, the access lock is " "already in use"); - if (vec->SyncArray) { - ierr = vec->SyncArray(vec, mem_type); CeedChk(ierr); + if (vec->SyncArrayGeneric) { + ierr = vec->SyncArrayGeneric(vec, mem_type, prec); CeedChk(ierr); } else { - const CeedScalar *array; - ierr = CeedVectorGetArrayRead(vec, mem_type, &array); CeedChk(ierr); - ierr = CeedVectorRestoreArrayRead(vec, &array); CeedChk(ierr); + const void *array; + ierr = CeedVectorGetArrayReadGeneric(vec, mem_type, prec, &array); + CeedChk(ierr); + ierr = CeedVectorRestoreArrayReadGeneric(vec, &array); CeedChk(ierr); } return CEED_ERROR_SUCCESS; } /** - @brief Take ownership of the CeedVector array set by @ref CeedVectorSetArray() + @brief Sync the CeedVector to a specified memtype. This function is used to + force synchronization of arrays set with @ref CeedVectorSetArray(). + If the requested memtype is already synchronized, this function + results in a no-op. + + @param vec CeedVector + @param mem_type Memtype to be synced + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorSyncArray(CeedVector vec, CeedMemType mem_type) { + return CeedVectorSyncArrayGeneric(vec, mem_type, CEED_SCALAR_TYPE); +} + +/** + @brief Take ownership of the specified precision array set by @ref CeedVectorSetArray() with @ref CEED_USE_POINTER and remove the array from the CeedVector. The caller is responsible for managing and freeing the array. This function will error if @ref CeedVectorSetArray() was not previously called with @ref CEED_USE_POINTER for the corresponding mem_type. + Intended for internal/backend use. @param vec CeedVector @param mem_type Memory type on which to take the array. If the backend uses a different memory type, this will perform a copy. + @param prec Scalar precision type for which to take the array. @param[out] array Array on memory type mem_type, or NULL if array pointer is not required @return An error code: 0 - success, otherwise - failure - @ref User + @ref Backend **/ -int CeedVectorTakeArray(CeedVector vec, CeedMemType mem_type, - CeedScalar **array) { +int CeedVectorTakeArrayGeneric(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec, void **array) { int ierr; if (vec->state % 2 == 1) @@ -379,10 +428,10 @@ int CeedVectorTakeArray(CeedVector vec, CeedMemType mem_type, "Cannot take CeedVector array, a process " "has read access"); // LCOV_EXCL_STOP - CeedScalar *temp_array = NULL; + void *temp_array = NULL; if (vec->length > 0) { bool has_borrowed_array_of_type = true; - ierr = CeedVectorHasBorrowedArrayOfType(vec, mem_type, + ierr = CeedVectorHasBorrowedArrayOfType(vec, mem_type, prec, &has_borrowed_array_of_type); CeedChk(ierr); if (!has_borrowed_array_of_type) @@ -401,19 +450,47 @@ int CeedVectorTakeArray(CeedVector vec, CeedMemType mem_type, "must set data with CeedVectorSetValue or CeedVectorSetArray"); // LCOV_EXCL_STOP - ierr = vec->TakeArray(vec, mem_type, &temp_array); CeedChk(ierr); + ierr = vec->TakeArrayGeneric(vec, mem_type, prec, &temp_array); CeedChk(ierr); } if (array) (*array) = temp_array; return CEED_ERROR_SUCCESS; } /** - @brief Get read/write access to a CeedVector via the specified memory type. - Restore access with @ref CeedVectorRestoreArray(). + @brief Take ownership of the CeedVector array set by @ref CeedVectorSetArray() + with @ref CEED_USE_POINTER and remove the array from the CeedVector. + The caller is responsible for managing and freeing the array. + This function will error if @ref CeedVectorSetArray() was not previously + called with @ref CEED_USE_POINTER for the corresponding mem_type. + + @param vec CeedVector + @param mem_type Memory type on which to take the array. If the backend + uses a different memory type, this will perform a copy. + @param[out] array Array on memory type mem_type, or NULL if array pointer is + not required + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorTakeArray(CeedVector vec, CeedMemType mem_type, + CeedScalar **array) { + return CeedVectorTakeArrayGeneric(vec, mem_type, CEED_SCALAR_TYPE, + (void **) array); +} + +/** + @brief Get read/write access to a CeedVector via the specified memory type + and scalar precision. + Restore access with @ref CeedVectorRestoreArrayGeneric(). + Intended for internal/backend use. @param vec CeedVector to access @param mem_type Memory type on which to access the array. If the backend uses a different memory type, this will perform a copy. + @param prec Scalar precision type for which to access the array. If + the data is currently in a different precision, this will + perform a copy and invalidate all other precisions. @param[out] array Array on memory type mem_type @note The CeedVectorGetArray* and CeedVectorRestoreArray* functions provide @@ -423,13 +500,13 @@ int CeedVectorTakeArray(CeedVector vec, CeedMemType mem_type, @return An error code: 0 - success, otherwise - failure - @ref User + @ref Backend **/ -int CeedVectorGetArray(CeedVector vec, CeedMemType mem_type, - CeedScalar **array) { +int CeedVectorGetArrayGeneric(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec, void **array) { int ierr; - if (!vec->GetArray) + if (!vec->GetArrayGeneric) // LCOV_EXCL_START return CeedError(vec->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support GetArray"); @@ -454,30 +531,57 @@ int CeedVectorGetArray(CeedVector vec, CeedMemType mem_type, "must set data with CeedVectorSetValue or CeedVectorSetArray"); // LCOV_EXCL_STOP - ierr = vec->GetArray(vec, mem_type, array); CeedChk(ierr); + ierr = vec->GetArrayGeneric(vec, mem_type, prec, array); CeedChk(ierr); vec->state++; return CEED_ERROR_SUCCESS; } /** - @brief Get read-only access to a CeedVector via the specified memory type. - Restore access with @ref CeedVectorRestoreArrayRead(). + @brief Get read/write access to a CeedVector via the specified memory type. + Restore access with @ref CeedVectorRestoreArray(). + + @param vec CeedVector to access + @param mem_type Memory type on which to access the array. If the backend + uses a different memory type, this will perform a copy. + @param[out] array Array on memory type mem_type + + @note The CeedVectorGetArray* and CeedVectorRestoreArray* functions provide + access to array pointers in the desired memory space. Pairing get/restore + allows the Vector to track access, thus knowing if norms or other + operations may need to be recomputed. + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorGetArray(CeedVector vec, CeedMemType mem_type, + CeedScalar **array) { + return CeedVectorGetArrayGeneric(vec, mem_type, CEED_SCALAR_TYPE, + (void **) array); +} + +/** + @brief Get read-only access to a CeedVector via the specified memory type + and precision. + Restore access with @ref CeedVectorRestoreArrayReadGeneric(). + Intended for internal/backend use. @param vec CeedVector to access @param mem_type Memory type on which to access the array. If the backend uses a different memory type, this will perform a copy (possibly cached). + @param prec @param[out] array Array on memory type mem_type @return An error code: 0 - success, otherwise - failure - @ref User + @ref Backend **/ -int CeedVectorGetArrayRead(CeedVector vec, CeedMemType mem_type, - const CeedScalar **array) { +int CeedVectorGetArrayReadGeneric(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec, const void **array) { int ierr; - if (!vec->GetArrayRead) + if (!vec->GetArrayReadGeneric) // LCOV_EXCL_START return CeedError(vec->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support GetArrayRead"); @@ -498,7 +602,7 @@ int CeedVectorGetArrayRead(CeedVector vec, CeedMemType mem_type, "must set data with CeedVectorSetValue or CeedVectorSetArray"); // LCOV_EXCL_STOP - ierr = vec->GetArrayRead(vec, mem_type, array); CeedChk(ierr); + ierr = vec->GetArrayReadGeneric(vec, mem_type, prec, array); CeedChk(ierr); } else { *array = NULL; } @@ -507,23 +611,47 @@ int CeedVectorGetArrayRead(CeedVector vec, CeedMemType mem_type, } /** - @brief Get write access to a CeedVector via the specified memory type. - Restore access with @ref CeedVectorRestoreArray(). All old + @brief Get read-only access to a CeedVector via the specified memory type. + Restore access with @ref CeedVectorRestoreArrayRead(). + + @param vec CeedVector to access + @param mem_type Memory type on which to access the array. If the backend + uses a different memory type, this will perform a copy + (possibly cached). + @param[out] array Array on memory type mem_type + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorGetArrayRead(CeedVector vec, CeedMemType mem_type, + const CeedScalar **array) { + return CeedVectorGetArrayReadGeneric(vec, mem_type, CEED_SCALAR_TYPE, + (const void **) array); +} + +/** + @brief Get write access to a CeedVector via the specified memory type and + precision. + Restore access with @ref CeedVectorRestoreArrayGeneric(). All old values should be assumed to be invalid. + Intended for internal/backend use. @param vec CeedVector to access @param mem_type Memory type on which to access the array. + @param prec Scalar precision type for which to access the array. Any other + precisions contained in the vector will become invalid. @param[out] array Array on memory type mem_type @return An error code: 0 - success, otherwise - failure - @ref User + @ref Backend **/ -int CeedVectorGetArrayWrite(CeedVector vec, CeedMemType mem_type, - CeedScalar **array) { +int CeedVectorGetArrayWriteGeneric(CeedVector vec, CeedMemType mem_type, + CeedScalarType prec, void **array) { int ierr; - if (!vec->GetArrayWrite) + if (!vec->GetArrayWriteGeneric) // LCOV_EXCL_START return CeedError(vec->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support GetArrayWrite"); @@ -543,31 +671,50 @@ int CeedVectorGetArrayWrite(CeedVector vec, CeedMemType mem_type, "process has read access"); // LCOV_EXCL_STOP - ierr = vec->GetArrayWrite(vec, mem_type, array); CeedChk(ierr); + ierr = vec->GetArrayWriteGeneric(vec, mem_type, prec, array); CeedChk(ierr); vec->state++; return CEED_ERROR_SUCCESS; } /** - @brief Restore an array obtained using @ref CeedVectorGetArray() - or @ref CeedVectorGetArrayWrite() + @brief Get write access to a CeedVector via the specified memory type. + Restore access with @ref CeedVectorRestoreArray(). All old + values should be assumed to be invalid. + + @param vec CeedVector to access + @param mem_type Memory type on which to access the array. + @param[out] array Array on memory type mem_type + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorGetArrayWrite(CeedVector vec, CeedMemType mem_type, + CeedScalar **array) { + return CeedVectorGetArrayWriteGeneric(vec, mem_type, CEED_SCALAR_TYPE, + (void **) array); +} + +/** + @brief Restore an array obtained using @ref CeedVectorGetArrayGeneric() + or @ref CeedVectorGetArrayWriteGeneric() @param vec CeedVector to restore @param array Array of vector data @return An error code: 0 - success, otherwise - failure - @ref User + @ref Backend **/ -int CeedVectorRestoreArray(CeedVector vec, CeedScalar **array) { +int CeedVectorRestoreArrayGeneric(CeedVector vec, void **array) { int ierr; if (vec->state % 2 != 1) return CeedError(vec->ceed, CEED_ERROR_ACCESS, "Cannot restore CeedVector array access, " "access was not granted"); - if (vec->RestoreArray) { - ierr = vec->RestoreArray(vec); CeedChk(ierr); + if (vec->RestoreArrayGeneric) { + ierr = vec->RestoreArrayGeneric(vec); CeedChk(ierr); } *array = NULL; vec->state++; @@ -575,7 +722,8 @@ int CeedVectorRestoreArray(CeedVector vec, CeedScalar **array) { } /** - @brief Restore an array obtained using @ref CeedVectorGetArrayRead() + @brief Restore an array obtained using @ref CeedVectorGetArray() + or @ref CeedVectorGetArrayWrite() @param vec CeedVector to restore @param array Array of vector data @@ -584,7 +732,21 @@ int CeedVectorRestoreArray(CeedVector vec, CeedScalar **array) { @ref User **/ -int CeedVectorRestoreArrayRead(CeedVector vec, const CeedScalar **array) { +int CeedVectorRestoreArray(CeedVector vec, CeedScalar **array) { + return CeedVectorRestoreArrayGeneric(vec, (void **) array); +} + +/** + @brief Restore an array obtained using @ref CeedVectorGetArrayReadGeneric() + + @param vec CeedVector to restore + @param array Array of vector data + + @return An error code: 0 - success, otherwise - failure + + @ref Backend +**/ +int CeedVectorRestoreArrayReadGeneric(CeedVector vec, const void **array) { int ierr; if (vec->num_readers == 0) @@ -594,14 +756,28 @@ int CeedVectorRestoreArrayRead(CeedVector vec, const CeedScalar **array) { "access was not granted"); // LCOV_EXCL_STOP - if (vec->RestoreArrayRead) { - ierr = vec->RestoreArrayRead(vec); CeedChk(ierr); + if (vec->RestoreArrayReadGeneric) { + ierr = vec->RestoreArrayReadGeneric(vec); CeedChk(ierr); } *array = NULL; vec->num_readers--; return CEED_ERROR_SUCCESS; } +/** + @brief Restore an array obtained using @ref CeedVectorGetArrayRead() + + @param vec CeedVector to restore + @param array Array of vector data + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorRestoreArrayRead(CeedVector vec, const CeedScalar **array) { + return CeedVectorRestoreArrayReadGeneric(vec, (const void **) array); +} + /** @brief Get the norm of a CeedVector. diff --git a/interface/ceed.c b/interface/ceed.c index 52961af6e9..bb46ddcda8 100644 --- a/interface/ceed.c +++ b/interface/ceed.c @@ -839,14 +839,14 @@ int CeedInit(const char *resource, Ceed *ceed) { CEED_FTABLE_ENTRY(Ceed, CompositeOperatorCreate), CEED_FTABLE_ENTRY(CeedVector, HasValidArray), CEED_FTABLE_ENTRY(CeedVector, HasBorrowedArrayOfType), - CEED_FTABLE_ENTRY(CeedVector, SetArray), - CEED_FTABLE_ENTRY(CeedVector, TakeArray), + CEED_FTABLE_ENTRY(CeedVector, SetArrayGeneric), + CEED_FTABLE_ENTRY(CeedVector, TakeArrayGeneric), CEED_FTABLE_ENTRY(CeedVector, SetValue), - CEED_FTABLE_ENTRY(CeedVector, GetArray), - CEED_FTABLE_ENTRY(CeedVector, GetArrayRead), - CEED_FTABLE_ENTRY(CeedVector, GetArrayWrite), - CEED_FTABLE_ENTRY(CeedVector, RestoreArray), - CEED_FTABLE_ENTRY(CeedVector, RestoreArrayRead), + CEED_FTABLE_ENTRY(CeedVector, GetArrayGeneric), + CEED_FTABLE_ENTRY(CeedVector, GetArrayReadGeneric), + CEED_FTABLE_ENTRY(CeedVector, GetArrayWriteGeneric), + CEED_FTABLE_ENTRY(CeedVector, RestoreArrayGeneric), + CEED_FTABLE_ENTRY(CeedVector, RestoreArrayReadGeneric), CEED_FTABLE_ENTRY(CeedVector, Norm), CEED_FTABLE_ENTRY(CeedVector, Scale), CEED_FTABLE_ENTRY(CeedVector, AXPY), From 775eb4c37f29825cb810a2311f478a38208522e3 Mon Sep 17 00:00:00 2001 From: nbeams <246972+nbeams@users.noreply.github.com> Date: Wed, 6 Apr 2022 17:44:41 -0600 Subject: [PATCH 02/10] WIP multiprecision vectors: adding multiprecision storage and some fcns to hip-ref --- backends/hip-ref/ceed-hip-ref-vector.c | 638 ++++++++++++++---- backends/hip-ref/ceed-hip-ref.h | 12 +- .../hip-ref/kernels/hip-ref-vector.hip.cpp | 55 ++ include/ceed/ceed.h | 8 +- 4 files changed, 574 insertions(+), 139 deletions(-) diff --git a/backends/hip-ref/ceed-hip-ref-vector.c b/backends/hip-ref/ceed-hip-ref-vector.c index a485c6ff2b..be042ffb9c 100644 --- a/backends/hip-ref/ceed-hip-ref-vector.c +++ b/backends/hip-ref/ceed-hip-ref-vector.c @@ -16,7 +16,30 @@ //------------------------------------------------------------------------------ // Sync host to device //------------------------------------------------------------------------------ -static inline int CeedVectorSyncH2D_Hip(const CeedVector vec) { +static inline int CeedScalarTypeGetSize_Hip(Ceed ceed, CeedScalarType prec, + size_t *size) { + switch(prec) { + case CEED_SCALAR_FP32: + *size = sizeof(float); + break; + case CEED_SCALAR_FP64: + *size = sizeof(double); + break; + default: + // LCOV_EXCL_START + return CeedError(ceed, CEED_ERROR_BACKEND, + "Invalid scalar precision type specified"); + // LCOV_EXCL_STOP + } + return CEED_ERROR_SUCCESS; +} + + +//------------------------------------------------------------------------------ +// Sync host to device +//------------------------------------------------------------------------------ +static inline int CeedVectorSyncH2D_Hip(const CeedVector vec, + const CeedScalarType prec) { int ierr; Ceed ceed; ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); @@ -25,26 +48,29 @@ static inline int CeedVectorSyncH2D_Hip(const CeedVector vec) { CeedSize length; ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); - size_t bytes = length * sizeof(CeedScalar); + size_t prec_size; + ierr = CeedScalarTypeGetSize_Hip(ceed, prec, &prec_size); + CeedChkBackend(ierr); + size_t bytes = length * prec_size; - if (!impl->h_array) + if (!impl->h_array.values[prec]) // LCOV_EXCL_START return CeedError(ceed, CEED_ERROR_BACKEND, "No valid host data to sync to device"); // LCOV_EXCL_STOP - if (impl->d_array_borrowed) { - impl->d_array = impl->d_array_borrowed; - } else if (impl->d_array_owned) { - impl->d_array = impl->d_array_owned; + if (impl->d_array_borrowed.values[prec]) { + impl->d_array.values[prec] = impl->d_array_borrowed.values[prec]; + } else if (impl->d_array_owned.values[prec]) { + impl->d_array.values[prec] = impl->d_array_owned.values[prec]; } else { - ierr = hipMalloc((void **)&impl->d_array_owned, bytes); + ierr = hipMalloc((void **)&impl->d_array_owned.values[prec], bytes); CeedChk_Hip(ceed, ierr); - impl->d_array = impl->d_array_owned; + impl->d_array.values[prec] = impl->d_array_owned.values[prec]; } - ierr = hipMemcpy(impl->d_array, impl->h_array, bytes, - hipMemcpyHostToDevice); CeedChk_Hip(ceed, ierr); + ierr = hipMemcpy(impl->d_array.values[prec], impl->h_array.values[prec], + bytes, hipMemcpyHostToDevice); CeedChk_Hip(ceed, ierr); return CEED_ERROR_SUCCESS; } @@ -52,35 +78,41 @@ static inline int CeedVectorSyncH2D_Hip(const CeedVector vec) { //------------------------------------------------------------------------------ // Sync device to host //------------------------------------------------------------------------------ -static inline int CeedVectorSyncD2H_Hip(const CeedVector vec) { +static inline int CeedVectorSyncD2H_Hip(const CeedVector vec, + const CeedScalarType prec) { int ierr; Ceed ceed; ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - if (!impl->d_array) + if (!impl->d_array.values[prec]) // LCOV_EXCL_START return CeedError(ceed, CEED_ERROR_BACKEND, "No valid device data to sync to host"); // LCOV_EXCL_STOP - if (impl->h_array_borrowed) { - impl->h_array = impl->h_array_borrowed; - } else if (impl->h_array_owned) { - impl->h_array = impl->h_array_owned; + CeedSize length; + ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); + size_t prec_size; + ierr = CeedScalarTypeGetSize_Hip(ceed, prec, &prec_size); + CeedChkBackend(ierr); + size_t bytes = length * prec_size; + + if (impl->h_array_borrowed.values[prec]) { + impl->h_array.values[prec] = impl->h_array_borrowed.values[prec]; + } else if (impl->h_array_owned.values[prec]) { + impl->h_array.values[prec] = impl->h_array_owned.values[prec]; } else { CeedSize length; ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); - ierr = CeedCalloc(length, &impl->h_array_owned); CeedChkBackend(ierr); - impl->h_array = impl->h_array_owned; + ierr = CeedCallocArray(length, prec_size,&impl->h_array_owned.values[prec]); + CeedChkBackend(ierr); + impl->h_array.values[prec] = impl->h_array_owned.values[prec]; } - CeedSize length; - ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); - size_t bytes = length * sizeof(CeedScalar); - ierr = hipMemcpy(impl->h_array, impl->d_array, bytes, - hipMemcpyDeviceToHost); CeedChk_Hip(ceed, ierr); + ierr = hipMemcpy(impl->h_array.values[prec], impl->d_array.values[prec], + bytes, hipMemcpyDeviceToHost); CeedChk_Hip(ceed, ierr); return CEED_ERROR_SUCCESS; } @@ -89,10 +121,174 @@ static inline int CeedVectorSyncD2H_Hip(const CeedVector vec) { // Sync arrays //------------------------------------------------------------------------------ static inline int CeedVectorSync_Hip(const CeedVector vec, - CeedMemType mem_type) { + CeedMemType mem_type, + CeedScalarType prec) { switch (mem_type) { - case CEED_MEM_HOST: return CeedVectorSyncD2H_Hip(vec); - case CEED_MEM_DEVICE: return CeedVectorSyncH2D_Hip(vec); + case CEED_MEM_HOST: return CeedVectorSyncD2H_Hip(vec, prec); + case CEED_MEM_DEVICE: return CeedVectorSyncH2D_Hip(vec, prec); + } + return CEED_ERROR_UNSUPPORTED; +} + + +//------------------------------------------------------------------------------ +// Convert vector's host array to new precision. +//------------------------------------------------------------------------------ +static int CeedVectorConvertArrayHost_Hip(CeedVector vec, + const CeedScalarType from_prec, const CeedScalarType to_prec) { + CeedInt ierr; + CeedSize length; + ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); + CeedVector_Hip *data; + ierr = CeedVectorGetData(vec, &data); CeedChkBackend(ierr); + + switch (from_prec) { + + case CEED_SCALAR_FP64: + switch (to_prec) { + case CEED_SCALAR_FP64: + // No conversion needed + break; + case CEED_SCALAR_FP32: + if (!data->h_array.values[CEED_SCALAR_FP32]) { + if (!data->h_array_owned.values[CEED_SCALAR_FP32]) { + ierr = CeedMalloc(length, + (float **) &data->h_array_owned.values[CEED_SCALAR_FP32]); + CeedChkBackend(ierr); + } + // Use owned memory + data->h_array.values[CEED_SCALAR_FP32] = + data->h_array_owned.values[CEED_SCALAR_FP32]; + } + float *float_data = (float *) data->h_array.values[CEED_SCALAR_FP32]; + double *double_data = (double *) data->h_array.values[CEED_SCALAR_FP64]; + for (int i = 0; i < length; i++) + float_data[i] = (float) double_data[i]; + break; + } + break; + + case CEED_SCALAR_FP32: + switch (to_prec) { + case CEED_SCALAR_FP64: + if (!data->h_array.values[CEED_SCALAR_FP64]) { + if (!data->h_array_owned.values[CEED_SCALAR_FP64]) { + ierr = CeedMalloc(length, + (double **) &data->h_array_owned.values[CEED_SCALAR_FP64]); + CeedChkBackend(ierr); + } + // Use owned memory + data->h_array.values[CEED_SCALAR_FP64] = + data->h_array_owned.values[CEED_SCALAR_FP64]; + } + float *float_data = (float *) data->h_array.values[CEED_SCALAR_FP32]; + double *double_data = (double *) data->h_array.values[CEED_SCALAR_FP64]; + for (int i = 0; i < length; i++) + double_data[i] = (double) float_data[i]; + break; + case CEED_SCALAR_FP32: + // No conversion needed + break; + } + break; + } + return CEED_ERROR_SUCCESS; +} + +//------------------------------------------------------------------------------ +// Convert a double-precision array to single precision +//------------------------------------------------------------------------------ +int CeedDeviceConvertArray_Hip_Fp64_Fp32(CeedInt length, + double *double_data, float *float_data); + +//------------------------------------------------------------------------------ +// Convert a single-precision array to double precision +//------------------------------------------------------------------------------ +int CeedDeviceConvertArray_Hip_Fp32_Fp64(CeedInt length, + float *float_data, double *double_data); + +//------------------------------------------------------------------------------ +// Convert device array to new precision(impl of individual functions/kernels in +// .hip.cpp file) +//------------------------------------------------------------------------------ +static int CeedVectorConvertArrayDevice_Hip(CeedVector vec, + const CeedScalarType from_prec, const CeedScalarType to_prec) { + + CeedSize length; + CeedInt ierr; + Ceed ceed; + ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); + ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); + CeedVector_Hip *data; + ierr = CeedVectorGetData(vec, &data); CeedChkBackend(ierr); + switch (from_prec) { + + case CEED_SCALAR_FP64: + switch (to_prec) { + case CEED_SCALAR_FP64: + // No conversion needed + break; + case CEED_SCALAR_FP32: + if (!data->d_array.values[CEED_SCALAR_FP32]) { + if (!data->d_array_owned.values[CEED_SCALAR_FP32]) { + size_t bytes = length * sizeof(float); + ierr = hipMalloc((void **)&data->d_array_owned.values[CEED_SCALAR_FP32], + bytes); + CeedChk_Hip(ceed, ierr); + } + // Use owned memory + data->d_array.values[CEED_SCALAR_FP32] = + data->d_array_owned.values[CEED_SCALAR_FP32]; + } + ierr = CeedDeviceConvertArray_Hip_Fp64_Fp32(length, + (double *) data->d_array.values[CEED_SCALAR_FP64], + (float *) data->d_array.values[CEED_SCALAR_FP32]); + CeedChkBackend(ierr); + break; + } + break; + + case CEED_SCALAR_FP32: + switch (to_prec) { + case CEED_SCALAR_FP64: + if (!data->d_array.values[CEED_SCALAR_FP64]) { + if (!data->d_array_owned.values[CEED_SCALAR_FP64]) { + size_t bytes = length * sizeof(double); + ierr = hipMalloc((void **)&data->d_array_owned.values[CEED_SCALAR_FP64], + bytes); + CeedChk_Hip(ceed, ierr); + } + // Use owned memory + data->d_array.values[CEED_SCALAR_FP64] = + data->d_array_owned.values[CEED_SCALAR_FP64]; + } + ierr = CeedDeviceConvertArray_Hip_Fp32_Fp64(length, + (float *) data->d_array.values[CEED_SCALAR_FP32], + (double *) data->d_array.values[CEED_SCALAR_FP64]); + CeedChkBackend(ierr); + break; + case CEED_SCALAR_FP32: + // No conversion needed + break; + } + break; + } + return CEED_ERROR_SUCCESS; +} + +//------------------------------------------------------------------------------ +// Convert data array from one precision to another (through copy/cast). +//------------------------------------------------------------------------------ +static int CeedVectorConvertArray_Hip(CeedVector vec, + const CeedMemType mem_type, + const CeedScalarType from_prec, + const CeedScalarType to_prec) { + + switch (mem_type) { + case CEED_MEM_HOST: return CeedVectorConvertArrayHost_Hip(vec, from_prec, + to_prec); + case CEED_MEM_DEVICE: return CeedVectorConvertArrayDevice_Hip(vec, from_prec, + to_prec); } return CEED_ERROR_UNSUPPORTED; } @@ -105,12 +301,50 @@ static inline int CeedVectorSetAllInvalid_Hip(const CeedVector vec) { CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - impl->h_array = NULL; - impl->d_array = NULL; + for (int i = 0; i < CEED_NUM_PRECISIONS; i++) { + impl->h_array.values[i] = NULL; + impl->d_array.values[i] = NULL; + } return CEED_ERROR_SUCCESS; } +//------------------------------------------------------------------------------ +// Return the scalar type of the valid array on mem_type, or the "preferred +// precision" for copying, if more than one precision is valid. If no +// precisions are valid on the specified mem_type, it will return +// CEED_SCALAR_TYPE (default precision); you should check for a valid array +// separately. +//------------------------------------------------------------------------------ +static inline int CeedVectorGetPrecision_Hip(const CeedVector vec, + const CeedMemType mem_type, CeedScalarType *preferred_precision) { + + int ierr; + CeedVector_Hip *impl; + ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); + + *preferred_precision = CEED_SCALAR_TYPE; + // Check for valid precisions, from most to least precise precise (we want + // the most precision if multiple arrays are valid) + switch (mem_type) { + case CEED_MEM_HOST: + if (!!impl->h_array.values[CEED_SCALAR_FP64]) + *preferred_precision = CEED_SCALAR_FP64; + else if (!!impl->h_array.values[CEED_SCALAR_FP32]) + *preferred_precision = CEED_SCALAR_FP32; + break; + case CEED_MEM_DEVICE: + if (!!impl->d_array.values[CEED_SCALAR_FP64]) + *preferred_precision = CEED_SCALAR_FP64; + else if (!!impl->d_array.values[CEED_SCALAR_FP32]) + *preferred_precision = CEED_SCALAR_FP32; + break; + } + + return CEED_ERROR_SUCCESS; +} + + //------------------------------------------------------------------------------ // Check if CeedVector has any valid pointers //------------------------------------------------------------------------------ @@ -120,7 +354,39 @@ static inline int CeedVectorHasValidArray_Hip(const CeedVector vec, CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - *has_valid_array = !!impl->h_array || !!impl->d_array; + *has_valid_array = false; + for (int i = 0; i < CEED_NUM_PRECISIONS; i++) { + *has_valid_array = *has_valid_array || + (!!impl->h_array.values[i] || !!impl->d_array.values[i]); + } + + return CEED_ERROR_SUCCESS; +} + +//------------------------------------------------------------------------------ +// Check if has valid array of given memory type +//------------------------------------------------------------------------------ +static inline int CeedVectorHasValidArrayOfMemType_Hip(const CeedVector vec, + CeedMemType mem_type, bool *has_valid_array_of_mem_type) { + int ierr; + CeedVector_Hip *impl; + ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); + + *has_valid_array_of_mem_type = false; + switch (mem_type) { + case CEED_MEM_HOST: + for (int i = 0; i < CEED_NUM_PRECISIONS; i++) { + *has_valid_array_of_mem_type = *has_valid_array_of_mem_type || + !!impl->h_array.values[i]; + } + break; + case CEED_MEM_DEVICE: + for (int i = 0; i < CEED_NUM_PRECISIONS; i++) { + *has_valid_array_of_mem_type = *has_valid_array_of_mem_type || + !!impl->d_array.values[i]; + } + break; + } return CEED_ERROR_SUCCESS; } @@ -129,17 +395,19 @@ static inline int CeedVectorHasValidArray_Hip(const CeedVector vec, // Check if has any array of given type //------------------------------------------------------------------------------ static inline int CeedVectorHasArrayOfType_Hip(const CeedVector vec, - CeedMemType mem_type, bool *has_array_of_type) { + CeedMemType mem_type, CeedScalarType prec, bool *has_array_of_type) { int ierr; CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); switch (mem_type) { case CEED_MEM_HOST: - *has_array_of_type = !!impl->h_array_borrowed || !!impl->h_array_owned; + *has_array_of_type = !!impl->h_array_borrowed.values[prec] || + !!impl->h_array_owned.values[prec]; break; case CEED_MEM_DEVICE: - *has_array_of_type = !!impl->d_array_borrowed || !!impl->d_array_owned; + *has_array_of_type = !!impl->d_array_borrowed.values[prec] || + !!impl->d_array_owned.values[prec]; break; } @@ -158,10 +426,10 @@ static inline int CeedVectorHasBorrowedArrayOfType_Hip(const CeedVector vec, switch (mem_type) { case CEED_MEM_HOST: - *has_borrowed_array_of_type = !!impl->h_array_borrowed; + *has_borrowed_array_of_type = !!impl->h_array_borrowed.values[prec]; break; case CEED_MEM_DEVICE: - *has_borrowed_array_of_type = !!impl->d_array_borrowed; + *has_borrowed_array_of_type = !!impl->d_array_borrowed.values[prec]; break; } @@ -169,7 +437,7 @@ static inline int CeedVectorHasBorrowedArrayOfType_Hip(const CeedVector vec, } //------------------------------------------------------------------------------ -// Sync array of given type +// Check if the only current valid array is on another MemType than mem_type //------------------------------------------------------------------------------ static inline int CeedVectorNeedSync_Hip(const CeedVector vec, CeedMemType mem_type, bool *need_sync) { @@ -179,14 +447,13 @@ static inline int CeedVectorNeedSync_Hip(const CeedVector vec, bool has_valid_array = false; ierr = CeedVectorHasValidArray(vec, &has_valid_array); CeedChkBackend(ierr); - switch (mem_type) { - case CEED_MEM_HOST: - *need_sync = has_valid_array && !impl->h_array; - break; - case CEED_MEM_DEVICE: - *need_sync = has_valid_array && !impl->d_array; - break; - } + bool has_valid_array_of_mem_type = false; + ierr = CeedVectorHasValidArrayOfMemType_Hip(vec, mem_type, + &has_valid_array_of_mem_type); + CeedChkBackend(ierr); + + // Check if we have a valid array, but not for the correct memory type + *need_sync = has_valid_array && !has_valid_array_of_mem_type; return CEED_ERROR_SUCCESS; } @@ -195,37 +462,45 @@ static inline int CeedVectorNeedSync_Hip(const CeedVector vec, // Set array from host //------------------------------------------------------------------------------ static int CeedVectorSetArrayHost_Hip(const CeedVector vec, + const CeedScalarType prec, const CeedCopyMode copy_mode, void *array) { int ierr; CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); + Ceed ceed; + ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); + size_t prec_size; + ierr = CeedScalarTypeGetSize_Hip(ceed, prec, &prec_size); + CeedChkBackend(ierr); + switch (copy_mode) { case CEED_COPY_VALUES: { CeedSize length; - if (!impl->h_array_owned) { + if (!impl->h_array_owned.values[prec]) { ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); - ierr = CeedMalloc(length, &impl->h_array_owned); CeedChkBackend(ierr); + ierr = CeedMallocArray(length, prec_size, &impl->h_array_owned.values[prec]); + CeedChkBackend(ierr); } - impl->h_array_borrowed = NULL; - impl->h_array = impl->h_array_owned; + impl->h_array_borrowed.values[prec] = NULL; + impl->h_array.values[prec] = impl->h_array_owned.values[prec]; if (array) { CeedSize length; ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); - size_t bytes = length * sizeof(CeedScalar); - memcpy(impl->h_array, array, bytes); + size_t bytes = length * prec_size; + memcpy(impl->h_array.values[prec], array, bytes); } } break; case CEED_OWN_POINTER: - ierr = CeedFree(&impl->h_array_owned); CeedChkBackend(ierr); - impl->h_array_owned = array; - impl->h_array_borrowed = NULL; - impl->h_array = array; + ierr = CeedFree(&impl->h_array_owned.values[prec]); CeedChkBackend(ierr); + impl->h_array_owned.values[prec] = array; + impl->h_array_borrowed.values[prec] = NULL; + impl->h_array.values[prec] = array; break; case CEED_USE_POINTER: - ierr = CeedFree(&impl->h_array_owned); CeedChkBackend(ierr); - impl->h_array_borrowed = array; - impl->h_array = array; + ierr = CeedFree(&impl->h_array_owned.values[prec]); CeedChkBackend(ierr); + impl->h_array_borrowed.values[prec] = array; + impl->h_array.values[prec] = array; break; } @@ -236,6 +511,7 @@ static int CeedVectorSetArrayHost_Hip(const CeedVector vec, // Set array from device //------------------------------------------------------------------------------ static int CeedVectorSetArrayDevice_Hip(const CeedVector vec, + const CeedScalarType prec, const CeedCopyMode copy_mode, void *array) { int ierr; Ceed ceed; @@ -243,33 +519,37 @@ static int CeedVectorSetArrayDevice_Hip(const CeedVector vec, CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); + size_t prec_size; + ierr = CeedScalarTypeGetSize_Hip(ceed, prec, &prec_size); + CeedChkBackend(ierr); + switch (copy_mode) { case CEED_COPY_VALUES: { CeedSize length; ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); - size_t bytes = length * sizeof(CeedScalar); - if (!impl->d_array_owned) { - ierr = hipMalloc((void **)&impl->d_array_owned, bytes); + size_t bytes = length * prec_size; + if (!impl->d_array_owned.values[prec]) { + ierr = hipMalloc((void **)&impl->d_array_owned.values[prec], bytes); CeedChk_Hip(ceed, ierr); } - impl->d_array_borrowed = NULL; - impl->d_array = impl->d_array_owned; + impl->d_array_borrowed.values[prec] = NULL; + impl->d_array.values[prec] = impl->d_array_owned.values[prec]; if (array) { - ierr = hipMemcpy(impl->d_array, array, bytes, + ierr = hipMemcpy(impl->d_array.values[prec], array, bytes, hipMemcpyDeviceToDevice); CeedChk_Hip(ceed, ierr); } } break; case CEED_OWN_POINTER: - ierr = hipFree(impl->d_array_owned); CeedChk_Hip(ceed, ierr); - impl->d_array_owned = array; - impl->d_array_borrowed = NULL; - impl->d_array = array; + ierr = hipFree(impl->d_array_owned.values[prec]); CeedChk_Hip(ceed, ierr); + impl->d_array_owned.values[prec] = array; + impl->d_array_borrowed.values[prec] = NULL; + impl->d_array.values[prec] = array; break; case CEED_USE_POINTER: - ierr = hipFree(impl->d_array_owned); CeedChk_Hip(ceed, ierr); - impl->d_array_owned = NULL; - impl->d_array_borrowed = array; - impl->d_array = array; + ierr = hipFree(impl->d_array_owned.values[prec]); CeedChk_Hip(ceed, ierr); + impl->d_array_owned.values[prec] = NULL; + impl->d_array_borrowed.values[prec] = array; + impl->d_array.values[prec] = array; break; } @@ -293,9 +573,9 @@ static int CeedVectorSetArrayGeneric_Hip(const CeedVector vec, ierr = CeedVectorSetAllInvalid_Hip(vec); CeedChkBackend(ierr); switch (mem_type) { case CEED_MEM_HOST: - return CeedVectorSetArrayHost_Hip(vec, copy_mode, array); + return CeedVectorSetArrayHost_Hip(vec, prec, copy_mode, array); case CEED_MEM_DEVICE: - return CeedVectorSetArrayDevice_Hip(vec, copy_mode, array); + return CeedVectorSetArrayDevice_Hip(vec, prec, copy_mode, array); } return CEED_ERROR_UNSUPPORTED; @@ -317,7 +597,7 @@ static int CeedHostSetValue_Hip(CeedScalar *h_array, CeedInt length, int CeedDeviceSetValue_Hip(CeedScalar *d_array, CeedInt length, CeedScalar val); //------------------------------------------------------------------------------ -// Set a vector to a value, +// Set a vector to a value //------------------------------------------------------------------------------ static int CeedVectorSetValue_Hip(CeedVector vec, CeedScalar val) { int ierr; @@ -329,25 +609,34 @@ static int CeedVectorSetValue_Hip(CeedVector vec, CeedScalar val) { ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); // Set value for synced device/host array - if (!impl->d_array && !impl->h_array) { - if (impl->d_array_borrowed) { - impl->d_array = impl->d_array_borrowed; - } else if (impl->h_array_borrowed) { - impl->h_array = impl->h_array_borrowed; - } else if (impl->d_array_owned) { - impl->d_array = impl->d_array_owned; - } else if (impl->h_array_owned) { - impl->h_array = impl->h_array_owned; + if (!impl->d_array.values[CEED_SCALAR_TYPE] && + !impl->h_array.values[CEED_SCALAR_TYPE]) { + if (impl->d_array_borrowed.values[CEED_SCALAR_TYPE]) { + impl->d_array.values[CEED_SCALAR_TYPE] = + impl->d_array_borrowed.values[CEED_SCALAR_TYPE]; + } else if (impl->h_array_borrowed.values[CEED_SCALAR_TYPE]) { + impl->h_array.values[CEED_SCALAR_TYPE] = + impl->h_array_borrowed.values[CEED_SCALAR_TYPE]; + } else if (impl->d_array_owned.values[CEED_SCALAR_TYPE]) { + impl->d_array.values[CEED_SCALAR_TYPE] = + impl->d_array_owned.values[CEED_SCALAR_TYPE]; + } else if (impl->h_array_owned.values[CEED_SCALAR_TYPE]) { + impl->h_array.values[CEED_SCALAR_TYPE] = + impl->h_array_owned.values[CEED_SCALAR_TYPE]; } else { ierr = CeedVectorSetArray(vec, CEED_MEM_DEVICE, CEED_COPY_VALUES, NULL); CeedChkBackend(ierr); } } - if (impl->d_array) { - ierr = CeedDeviceSetValue_Hip(impl->d_array, length, val); CeedChkBackend(ierr); + if (impl->d_array.values[CEED_SCALAR_TYPE]) { + ierr = CeedDeviceSetValue_Hip(impl->d_array.values[CEED_SCALAR_TYPE], length, + val); + CeedChkBackend(ierr); } - if (impl->h_array) { - ierr = CeedHostSetValue_Hip(impl->h_array, length, val); CeedChkBackend(ierr); + if (impl->h_array.values[CEED_SCALAR_TYPE]) { + ierr = CeedHostSetValue_Hip(impl->h_array.values[CEED_SCALAR_TYPE], length, + val); + CeedChkBackend(ierr); } return CEED_ERROR_SUCCESS; @@ -365,24 +654,55 @@ static int CeedVectorTakeArrayGeneric_Hip(CeedVector vec, CeedMemType mem_type, CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - // Sync array to requested mem_type bool need_sync = false; - ierr = CeedVectorNeedSync_Hip(vec, mem_type, &need_sync); CeedChkBackend(ierr); + ierr = CeedVectorNeedSync_Hip(vec, mem_type, &need_sync); + CeedChkBackend(ierr); if (need_sync) { - ierr = CeedVectorSync_Hip(vec, mem_type); CeedChkBackend(ierr); + CeedMemType source_mem_type = CEED_MEM_HOST; + if (mem_type == CEED_MEM_HOST) source_mem_type = CEED_MEM_DEVICE; + // Sync array to requested mem_type + // Figure out which current precision we have to convert from + CeedScalarType source_cur_prec; + ierr = CeedVectorGetPrecision_Hip(vec, source_mem_type, &source_cur_prec); + CeedChkBackend(ierr); + if (source_cur_prec != prec) { + size_t cur_prec_size, prec_size; + ierr = CeedScalarTypeGetSize_Hip(ceed, source_cur_prec, &cur_prec_size); + CeedChkBackend(ierr); + size_t ierr = CeedScalarTypeGetSize_Hip(ceed, prec, &prec_size); + CeedChkBackend(ierr); + + // If the size of the current precision's data type is less than + // the destination precision, we want to sync first and then convert (conversion + // handled outside this sync check). + if (cur_prec_size < prec_size) { + ierr = CeedVectorSync_Hip(vec, mem_type, source_cur_prec); CeedChkBackend(ierr); + CeedChkBackend(ierr); + } else { + ierr = CeedVectorConvertArray_Hip(vec, source_mem_type, source_cur_prec, prec); + ierr = CeedVectorSync_Hip(vec, mem_type, prec); CeedChkBackend(ierr); + } + } else + ierr = CeedVectorSync_Hip(vec, mem_type, prec); CeedChkBackend(ierr); } + // Check if we need to convert from another precision + CeedScalarType cur_prec; + ierr = CeedVectorGetPrecision_Hip(vec, mem_type, &cur_prec); + CeedChkBackend(ierr); + if (cur_prec != prec) + ierr = CeedVectorConvertArray_Hip(vec, mem_type, cur_prec, prec); // Update pointer switch (mem_type) { case CEED_MEM_HOST: - (*array) = impl->h_array_borrowed; - impl->h_array_borrowed = NULL; - impl->h_array = NULL; + (*array) = impl->h_array_borrowed.values[prec]; + impl->h_array_borrowed.values[prec] = NULL; + impl->h_array.values[prec] = NULL; break; case CEED_MEM_DEVICE: - (*array) = impl->d_array_borrowed; - impl->d_array_borrowed = NULL; - impl->d_array = NULL; + (*array) = impl->d_array_borrowed.values[prec]; + impl->d_array_borrowed.values[prec] = NULL; + impl->d_array.values[prec] = NULL; break; } @@ -404,20 +724,49 @@ static int CeedVectorGetArrayCore_Hip(const CeedVector vec, ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); bool need_sync = false; - ierr = CeedVectorNeedSync_Hip(vec, mem_type, &need_sync); CeedChkBackend(ierr); + ierr = CeedVectorNeedSync_Hip(vec, mem_type, &need_sync); CeedChkBackend(ierr); if (need_sync) { + CeedMemType source_mem_type = CEED_MEM_HOST; + if (mem_type == CEED_MEM_HOST) source_mem_type = CEED_MEM_DEVICE; // Sync array to requested mem_type - ierr = CeedVectorSync_Hip(vec, mem_type); CeedChkBackend(ierr); - } + // Figure out which current precision we have to convert from + CeedScalarType source_cur_prec; + ierr = CeedVectorGetPrecision_Hip(vec, source_mem_type, &source_cur_prec); + CeedChkBackend(ierr); + if (source_cur_prec != prec) { + size_t cur_prec_size, prec_size; + ierr = CeedScalarTypeGetSize_Hip(ceed, source_cur_prec, &cur_prec_size); + CeedChkBackend(ierr); + size_t ierr = CeedScalarTypeGetSize_Hip(ceed, prec, &prec_size); + CeedChkBackend(ierr); + // If the size of the current precision's data type is less than + // the destination precision, we want to sync first and then convert (conversion + // handled outside this sync check). + if (cur_prec_size < prec_size) { + ierr = CeedVectorSync_Hip(vec, mem_type, source_cur_prec); CeedChkBackend(ierr); + CeedChkBackend(ierr); + } else { + ierr = CeedVectorConvertArray_Hip(vec, source_mem_type, source_cur_prec, prec); + ierr = CeedVectorSync_Hip(vec, mem_type, prec); CeedChkBackend(ierr); + } + } else + ierr = CeedVectorSync_Hip(vec, mem_type, prec); CeedChkBackend(ierr); + } + // Check if we need to convert from another precision + CeedScalarType cur_prec; + ierr = CeedVectorGetPrecision_Hip(vec, mem_type, &cur_prec); + CeedChkBackend(ierr); + if (cur_prec != prec) + ierr = CeedVectorConvertArray_Hip(vec, mem_type, cur_prec, prec); // Update pointer switch (mem_type) { case CEED_MEM_HOST: - *array = impl->h_array; + *array = impl->h_array.values[prec]; break; case CEED_MEM_DEVICE: - *array = impl->d_array; + *array = impl->d_array.values[prec]; break; } @@ -451,10 +800,10 @@ static int CeedVectorGetArrayGeneric_Hip(const CeedVector vec, ierr = CeedVectorSetAllInvalid_Hip(vec); CeedChkBackend(ierr); switch (mem_type) { case CEED_MEM_HOST: - impl->h_array = *array; + impl->h_array.values[prec] = *array; break; case CEED_MEM_DEVICE: - impl->d_array = *array; + impl->d_array.values[prec] = *array; break; } @@ -473,7 +822,7 @@ static int CeedVectorGetArrayWriteGeneric_Hip(const CeedVector vec, ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); bool has_array_of_type = true; - ierr = CeedVectorHasArrayOfType_Hip(vec, mem_type, &has_array_of_type); + ierr = CeedVectorHasArrayOfType_Hip(vec, mem_type, prec, &has_array_of_type); CeedChkBackend(ierr); if (!has_array_of_type) { // Allocate if array is not yet allocated @@ -483,16 +832,16 @@ static int CeedVectorGetArrayWriteGeneric_Hip(const CeedVector vec, // Select dirty array switch (mem_type) { case CEED_MEM_HOST: - if (impl->h_array_borrowed) - impl->h_array = impl->h_array_borrowed; + if (impl->h_array_borrowed.values[prec]) + impl->h_array.values[prec] = impl->h_array_borrowed.values[prec]; else - impl->h_array = impl->h_array_owned; + impl->h_array.values[prec] = impl->h_array_owned.values[prec]; break; case CEED_MEM_DEVICE: - if (impl->d_array_borrowed) - impl->d_array = impl->d_array_borrowed; + if (impl->d_array_borrowed.values[prec]) + impl->d_array.values[prec] = impl->d_array_borrowed.values[prec]; else - impl->d_array = impl->d_array_owned; + impl->d_array.values[prec] = impl->d_array_owned.values[prec]; } } @@ -546,7 +895,9 @@ static int CeedVectorNorm_Hip(CeedVector vec, CeedNormType type, } CeedChk_Hipblas(ceed, ierr); CeedScalar normNoAbs; - ierr = hipMemcpy(&normNoAbs, impl->d_array+indx-1, sizeof(CeedScalar), + ierr = hipMemcpy(&normNoAbs, + (CeedScalar *)(impl->d_array.values[CEED_SCALAR_TYPE])+indx-1, + sizeof(CeedScalar), hipMemcpyDeviceToHost); CeedChk_Hip(ceed, ierr); *norm = fabs(normNoAbs); break; @@ -585,11 +936,15 @@ static int CeedVectorReciprocal_Hip(CeedVector vec) { ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); // Set value for synced device/host array - if (impl->d_array) { - ierr = CeedDeviceReciprocal_Hip(impl->d_array, length); CeedChkBackend(ierr); + if (impl->d_array.values[CEED_SCALAR_TYPE]) { + ierr = CeedDeviceReciprocal_Hip((CeedScalar *) + impl->d_array.values[CEED_SCALAR_TYPE], + length); CeedChkBackend(ierr); } - if (impl->h_array) { - ierr = CeedHostReciprocal_Hip(impl->h_array, length); CeedChkBackend(ierr); + if (impl->h_array.values[CEED_SCALAR_TYPE]) { + ierr = CeedHostReciprocal_Hip((CeedScalar *) + impl->h_array.values[CEED_SCALAR_TYPE], + length); CeedChkBackend(ierr); } return CEED_ERROR_SUCCESS; @@ -624,12 +979,16 @@ static int CeedVectorScale_Hip(CeedVector x, CeedScalar alpha) { ierr = CeedVectorGetLength(x, &length); CeedChkBackend(ierr); // Set value for synced device/host array - if (x_impl->d_array) { - ierr = CeedDeviceScale_Hip(x_impl->d_array, alpha, length); + if (x_impl->d_array.values[CEED_SCALAR_TYPE]) { + ierr = CeedDeviceScale_Hip((CeedScalar *) + x_impl->d_array.values[CEED_SCALAR_TYPE], + alpha, length); CeedChkBackend(ierr); } - if (x_impl->h_array) { - ierr = CeedHostScale_Hip(x_impl->h_array, alpha, length); CeedChkBackend(ierr); + if (x_impl->h_array.values[CEED_SCALAR_TYPE]) { + ierr = CeedHostScale_Hip((CeedScalar *) + x_impl->h_array.values[CEED_SCALAR_TYPE], + alpha, length); CeedChkBackend(ierr); } return CEED_ERROR_SUCCESS; @@ -665,14 +1024,18 @@ static int CeedVectorAXPY_Hip(CeedVector y, CeedScalar alpha, CeedVector x) { ierr = CeedVectorGetLength(y, &length); CeedChkBackend(ierr); // Set value for synced device/host array - if (y_impl->d_array) { + if (y_impl->d_array.values[CEED_SCALAR_TYPE]) { ierr = CeedVectorSyncArray(x, CEED_MEM_DEVICE); CeedChkBackend(ierr); - ierr = CeedDeviceAXPY_Hip(y_impl->d_array, alpha, x_impl->d_array, length); + ierr = CeedDeviceAXPY_Hip((CeedScalar *) + y_impl->d_array.values[CEED_SCALAR_TYPE], + alpha, (CeedScalar *) x_impl->d_array.values[CEED_SCALAR_TYPE], + length); CeedChkBackend(ierr); } - if (y_impl->h_array) { + if (y_impl->h_array.values[CEED_SCALAR_TYPE]) { ierr = CeedVectorSyncArray(x, CEED_MEM_HOST); CeedChkBackend(ierr); - ierr = CeedHostAXPY_Hip(y_impl->h_array, alpha, x_impl->h_array, length); + ierr = CeedHostAXPY_Hip((CeedScalar *) y_impl->h_array.values[CEED_SCALAR_TYPE], + alpha, (CeedScalar *) x_impl->h_array.values[CEED_SCALAR_TYPE], length); CeedChkBackend(ierr); } @@ -711,21 +1074,26 @@ static int CeedVectorPointwiseMult_Hip(CeedVector w, CeedVector x, ierr = CeedVectorGetLength(w, &length); CeedChkBackend(ierr); // Set value for synced device/host array - if (!w_impl->d_array && !w_impl->h_array) { + if (!w_impl->d_array.values[CEED_SCALAR_TYPE] && + !w_impl->h_array.values[CEED_SCALAR_TYPE]) { ierr = CeedVectorSetValue(w, 0.0); CeedChkBackend(ierr); } - if (w_impl->d_array) { + if (w_impl->d_array.values[CEED_SCALAR_TYPE]) { ierr = CeedVectorSyncArray(x, CEED_MEM_DEVICE); CeedChkBackend(ierr); ierr = CeedVectorSyncArray(y, CEED_MEM_DEVICE); CeedChkBackend(ierr); - ierr = CeedDevicePointwiseMult_Hip(w_impl->d_array, x_impl->d_array, - y_impl->d_array, length); + ierr = CeedDevicePointwiseMult_Hip((CeedScalar *) + w_impl->d_array.values[CEED_SCALAR_TYPE], + (CeedScalar *) x_impl->d_array.values[CEED_SCALAR_TYPE], + (CeedScalar *) y_impl->d_array.values[CEED_SCALAR_TYPE], length); CeedChkBackend(ierr); } - if (w_impl->h_array) { + if (w_impl->h_array.values[CEED_SCALAR_TYPE]) { ierr = CeedVectorSyncArray(x, CEED_MEM_HOST); CeedChkBackend(ierr); ierr = CeedVectorSyncArray(y, CEED_MEM_HOST); CeedChkBackend(ierr); - ierr = CeedHostPointwiseMult_Hip(w_impl->h_array, x_impl->h_array, - y_impl->h_array, length); + ierr = CeedHostPointwiseMult_Hip((CeedScalar *) + w_impl->h_array.values[CEED_SCALAR_TYPE], + (CeedScalar *) x_impl->h_array.values[CEED_SCALAR_TYPE], + (CeedScalar *) y_impl->h_array.values[CEED_SCALAR_TYPE], length); CeedChkBackend(ierr); } @@ -742,8 +1110,14 @@ static int CeedVectorDestroy_Hip(const CeedVector vec) { CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - ierr = hipFree(impl->d_array_owned); CeedChk_Hip(ceed, ierr); - ierr = CeedFree(&impl->h_array_owned); CeedChkBackend(ierr); + for (int i = 0; i < CEED_NUM_PRECISIONS; i++) { + if (impl->d_array_owned.values[i]) { + ierr = hipFree(impl->d_array_owned.values[i]); CeedChk_Hip(ceed, ierr); + } + if (impl->h_array_owned.values[i]) { + ierr = CeedFree(&impl->h_array_owned.values[i]); CeedChkBackend(ierr); + } + } ierr = CeedFree(&impl); CeedChkBackend(ierr); return CEED_ERROR_SUCCESS; diff --git a/backends/hip-ref/ceed-hip-ref.h b/backends/hip-ref/ceed-hip-ref.h index eb54806aee..845b1e537d 100644 --- a/backends/hip-ref/ceed-hip-ref.h +++ b/backends/hip-ref/ceed-hip-ref.h @@ -15,12 +15,12 @@ #include "../hip/ceed-hip-common.h" typedef struct { - CeedScalar *h_array; - CeedScalar *h_array_borrowed; - CeedScalar *h_array_owned; - CeedScalar *d_array; - CeedScalar *d_array_borrowed; - CeedScalar *d_array_owned; + CeedScalarArray h_array; + CeedScalarArray h_array_borrowed; + CeedScalarArray h_array_owned; + CeedScalarArray d_array; + CeedScalarArray d_array_borrowed; + CeedScalarArray d_array_owned; } CeedVector_Hip; typedef struct { diff --git a/backends/hip-ref/kernels/hip-ref-vector.hip.cpp b/backends/hip-ref/kernels/hip-ref-vector.hip.cpp index 7c5525b953..de9c581a60 100644 --- a/backends/hip-ref/kernels/hip-ref-vector.hip.cpp +++ b/backends/hip-ref/kernels/hip-ref-vector.hip.cpp @@ -34,6 +34,61 @@ extern "C" int CeedDeviceSetValue_Hip(CeedScalar* d_array, CeedInt length, return 0; } +//------------------------------------------------------------------------------ +// Kernel for converting double to single +//------------------------------------------------------------------------------ +__global__ static void convertFp64Fp32(CeedInt length, double* double_data, + float* float_data) { + int idx = threadIdx.x + blockDim.x * blockIdx.x; + if (idx >= length) + return; + float_data[idx] = (float) double_data[idx]; +} + +//------------------------------------------------------------------------------ +// Convert a double-precision array to single precision +//------------------------------------------------------------------------------ +extern "C" int CeedDeviceConvertArray_Hip_Fp64_Fp32(CeedInt length, + double* double_data, + float* float_data) { + const int bsize = 512; + const int vecsize = length; + int gridsize = vecsize / bsize; + + if (bsize * gridsize < vecsize) + gridsize += 1; + convertFp64Fp32<<>>(length, double_data, float_data); + return 0; +} + +//------------------------------------------------------------------------------ +// Kernel for converting single to double +//------------------------------------------------------------------------------ +__global__ static void convertFp32Fp64(CeedInt length, float* float_data, + double* double_data) { + int idx = threadIdx.x + blockDim.x * blockIdx.x; + if (idx >= length) + return; + double_data[idx] = (double) float_data[idx]; +} + +//------------------------------------------------------------------------------ +// Convert a single-precision array to double precision +//------------------------------------------------------------------------------ +extern "C" int CeedDeviceConvertArray_Hip_Fp32_Fp64(CeedInt length, + float* float_data, + double* double_data) { + const int bsize = 512; + const int vecsize = length; + int gridsize = vecsize / bsize; + + if (bsize * gridsize < vecsize) + gridsize += 1; + convertFp32Fp64<<>>(length, float_data, double_data); + return 0; + +} + //------------------------------------------------------------------------------ // Kernel for taking reciprocal //------------------------------------------------------------------------------ diff --git a/include/ceed/ceed.h b/include/ceed/ceed.h index 2f827c81d4..217b3204fc 100644 --- a/include/ceed/ceed.h +++ b/include/ceed/ceed.h @@ -140,7 +140,6 @@ typedef int32_t CeedInt; typedef ptrdiff_t CeedSize; /// Scalar (floating point) types -/// /// @ingroup Ceed typedef enum { /// Single precision @@ -148,6 +147,13 @@ typedef enum { /// Double precision CEED_SCALAR_FP64 } CeedScalarType; +/// Total number of allowed scalar precision types (size of CeedScalarType enum) +#define CEED_NUM_PRECISIONS 2 +/// Struct for holding data in multiple precisions for mixed-precision-enabled +/// backends +typedef struct { + void *values[2]; // Size equals CEED_NUM_PRECISIONS +} CeedScalarArray; /// Base scalar type for the library to use: change which header is /// included to change the precision. #include "ceed-f64.h" From 3b67d1a67676bbca94331157d436c579ee552f95 Mon Sep 17 00:00:00 2001 From: nbeams <246972+nbeams@users.noreply.github.com> Date: Wed, 20 Apr 2022 15:17:35 -0600 Subject: [PATCH 03/10] WIP hip-ref: use backend fcn for sync, streamline logic --- backends/cuda-ref/ceed-cuda-vector.c | 2 +- backends/hip-ref/ceed-hip-ref-vector.c | 572 +++++++++++++------------ interface/ceed.c | 1 + 3 files changed, 306 insertions(+), 269 deletions(-) diff --git a/backends/cuda-ref/ceed-cuda-vector.c b/backends/cuda-ref/ceed-cuda-vector.c index 5ed7229ae1..8fbbdec739 100644 --- a/backends/cuda-ref/ceed-cuda-vector.c +++ b/backends/cuda-ref/ceed-cuda-vector.c @@ -88,7 +88,7 @@ static inline int CeedVectorSyncD2H_Cuda(const CeedVector vec) { //------------------------------------------------------------------------------ // Sync arrays //------------------------------------------------------------------------------ -static inline int CeedVectorSyncGeneric_Cuda(const CeedVector vec, +static inline int CeedVectorSync_Cuda(const CeedVector vec, CeedScalarType prec, CeedMemType mem_type) { switch (mem_type) { diff --git a/backends/hip-ref/ceed-hip-ref-vector.c b/backends/hip-ref/ceed-hip-ref-vector.c index be042ffb9c..7e07b7d8db 100644 --- a/backends/hip-ref/ceed-hip-ref-vector.c +++ b/backends/hip-ref/ceed-hip-ref-vector.c @@ -14,7 +14,8 @@ #include "ceed-hip-ref.h" //------------------------------------------------------------------------------ -// Sync host to device +// Get size of the scalar type +// TODO: move to interface level for all backends? //------------------------------------------------------------------------------ static inline int CeedScalarTypeGetSize_Hip(Ceed ceed, CeedScalarType prec, size_t *size) { @@ -34,103 +35,150 @@ static inline int CeedScalarTypeGetSize_Hip(Ceed ceed, CeedScalarType prec, return CEED_ERROR_SUCCESS; } - //------------------------------------------------------------------------------ -// Sync host to device +// Set all pointers as invalid //------------------------------------------------------------------------------ -static inline int CeedVectorSyncH2D_Hip(const CeedVector vec, - const CeedScalarType prec) { +static inline int CeedVectorSetAllInvalid_Hip(const CeedVector vec) { int ierr; - Ceed ceed; - ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - CeedSize length; - ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); - size_t prec_size; - ierr = CeedScalarTypeGetSize_Hip(ceed, prec, &prec_size); - CeedChkBackend(ierr); - size_t bytes = length * prec_size; + for (int i = 0; i < CEED_NUM_PRECISIONS; i++) { + impl->h_array.values[i] = NULL; + impl->d_array.values[i] = NULL; + } - if (!impl->h_array.values[prec]) - // LCOV_EXCL_START - return CeedError(ceed, CEED_ERROR_BACKEND, - "No valid host data to sync to device"); - // LCOV_EXCL_STOP + return CEED_ERROR_SUCCESS; +} - if (impl->d_array_borrowed.values[prec]) { - impl->d_array.values[prec] = impl->d_array_borrowed.values[prec]; - } else if (impl->d_array_owned.values[prec]) { - impl->d_array.values[prec] = impl->d_array_owned.values[prec]; - } else { - ierr = hipMalloc((void **)&impl->d_array_owned.values[prec], bytes); - CeedChk_Hip(ceed, ierr); - impl->d_array.values[prec] = impl->d_array_owned.values[prec]; - } - ierr = hipMemcpy(impl->d_array.values[prec], impl->h_array.values[prec], - bytes, hipMemcpyHostToDevice); CeedChk_Hip(ceed, ierr); +//------------------------------------------------------------------------------ +// Check if CeedVector has any valid pointers +//------------------------------------------------------------------------------ +static inline int CeedVectorHasValidArray_Hip(const CeedVector vec, + bool *has_valid_array) { + int ierr; + CeedVector_Hip *impl; + ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); + + *has_valid_array = false; + for (int i = 0; i < CEED_NUM_PRECISIONS; i++) { + *has_valid_array = *has_valid_array || + (!!impl->h_array.values[i] || !!impl->d_array.values[i]); + } return CEED_ERROR_SUCCESS; } //------------------------------------------------------------------------------ -// Sync device to host +// Check if has valid array of given memory type //------------------------------------------------------------------------------ -static inline int CeedVectorSyncD2H_Hip(const CeedVector vec, - const CeedScalarType prec) { +static inline int CeedVectorHasValidArrayOfMemType_Hip(const CeedVector vec, + CeedMemType mem_type, bool *has_valid_array_of_mem_type) { int ierr; - Ceed ceed; - ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - if (!impl->d_array.values[prec]) - // LCOV_EXCL_START - return CeedError(ceed, CEED_ERROR_BACKEND, - "No valid device data to sync to host"); - // LCOV_EXCL_STOP + *has_valid_array_of_mem_type = false; + switch (mem_type) { + case CEED_MEM_HOST: + for (int i = 0; i < CEED_NUM_PRECISIONS; i++) { + *has_valid_array_of_mem_type = *has_valid_array_of_mem_type || + !!impl->h_array.values[i]; + } + break; + case CEED_MEM_DEVICE: + for (int i = 0; i < CEED_NUM_PRECISIONS; i++) { + *has_valid_array_of_mem_type = *has_valid_array_of_mem_type || + !!impl->d_array.values[i]; + } + break; + } - CeedSize length; - ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); - size_t prec_size; - ierr = CeedScalarTypeGetSize_Hip(ceed, prec, &prec_size); - CeedChkBackend(ierr); - size_t bytes = length * prec_size; + return CEED_ERROR_SUCCESS; +} - if (impl->h_array_borrowed.values[prec]) { - impl->h_array.values[prec] = impl->h_array_borrowed.values[prec]; - } else if (impl->h_array_owned.values[prec]) { - impl->h_array.values[prec] = impl->h_array_owned.values[prec]; - } else { - CeedSize length; - ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); - ierr = CeedCallocArray(length, prec_size,&impl->h_array_owned.values[prec]); - CeedChkBackend(ierr); - impl->h_array.values[prec] = impl->h_array_owned.values[prec]; - } +//------------------------------------------------------------------------------ +// Check if has any array of given type +//------------------------------------------------------------------------------ +static inline int CeedVectorHasArrayOfType_Hip(const CeedVector vec, + CeedMemType mem_type, CeedScalarType prec, bool *has_array_of_type) { + int ierr; + CeedVector_Hip *impl; + ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - ierr = hipMemcpy(impl->h_array.values[prec], impl->d_array.values[prec], - bytes, hipMemcpyDeviceToHost); CeedChk_Hip(ceed, ierr); + switch (mem_type) { + case CEED_MEM_HOST: + *has_array_of_type = !!impl->h_array_borrowed.values[prec] || + !!impl->h_array_owned.values[prec]; + break; + case CEED_MEM_DEVICE: + *has_array_of_type = !!impl->d_array_borrowed.values[prec] || + !!impl->d_array_owned.values[prec]; + break; + } return CEED_ERROR_SUCCESS; } //------------------------------------------------------------------------------ -// Sync arrays +// Check if has borrowed array of given type //------------------------------------------------------------------------------ -static inline int CeedVectorSync_Hip(const CeedVector vec, - CeedMemType mem_type, - CeedScalarType prec) { +static inline int CeedVectorHasBorrowedArrayOfType_Hip(const CeedVector vec, + CeedMemType mem_type, CeedScalarType prec, + bool *has_borrowed_array_of_type) { + int ierr; + CeedVector_Hip *impl; + ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); + switch (mem_type) { - case CEED_MEM_HOST: return CeedVectorSyncD2H_Hip(vec, prec); - case CEED_MEM_DEVICE: return CeedVectorSyncH2D_Hip(vec, prec); + case CEED_MEM_HOST: + *has_borrowed_array_of_type = !!impl->h_array_borrowed.values[prec]; + break; + case CEED_MEM_DEVICE: + *has_borrowed_array_of_type = !!impl->d_array_borrowed.values[prec]; + break; } - return CEED_ERROR_UNSUPPORTED; + + return CEED_ERROR_SUCCESS; } +//------------------------------------------------------------------------------ +// Return the scalar type of the valid array on mem_type, or the "preferred +// precision" for copying, if more than one precision is valid. If no +// precisions are valid on the specified mem_type, it will return +// CEED_SCALAR_TYPE (default precision); you should check for a valid array +// separately. +//------------------------------------------------------------------------------ +static inline int CeedVectorGetPrecision_Hip(const CeedVector vec, + const CeedMemType mem_type, CeedScalarType *preferred_precision) { + + int ierr; + CeedVector_Hip *impl; + ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); + + *preferred_precision = CEED_SCALAR_TYPE; + // Check for valid precisions, from most to least precise precise (we want + // the most precision if multiple arrays are valid) + switch (mem_type) { + case CEED_MEM_HOST: + if (!!impl->h_array.values[CEED_SCALAR_FP64]) + *preferred_precision = CEED_SCALAR_FP64; + else if (!!impl->h_array.values[CEED_SCALAR_FP32]) + *preferred_precision = CEED_SCALAR_FP32; + break; + case CEED_MEM_DEVICE: + if (!!impl->d_array.values[CEED_SCALAR_FP64]) + *preferred_precision = CEED_SCALAR_FP64; + else if (!!impl->d_array.values[CEED_SCALAR_FP32]) + *preferred_precision = CEED_SCALAR_FP32; + break; + } + + return CEED_ERROR_SUCCESS; +} + //------------------------------------------------------------------------------ // Convert vector's host array to new precision. //------------------------------------------------------------------------------ @@ -151,14 +199,20 @@ static int CeedVectorConvertArrayHost_Hip(CeedVector vec, break; case CEED_SCALAR_FP32: if (!data->h_array.values[CEED_SCALAR_FP32]) { - if (!data->h_array_owned.values[CEED_SCALAR_FP32]) { - ierr = CeedMalloc(length, - (float **) &data->h_array_owned.values[CEED_SCALAR_FP32]); - CeedChkBackend(ierr); + // Use borrowed memory, if we have it for this precision + if (data->h_array_borrowed.values[CEED_SCALAR_FP32]) { + data->h_array.values[CEED_SCALAR_FP32] = + data->h_array_borrowed.values[CEED_SCALAR_FP32]; + } else { + // Use owned memory + if (!data->h_array_owned.values[CEED_SCALAR_FP32]) { + ierr = CeedMalloc(length, + (float **) &data->h_array_owned.values[CEED_SCALAR_FP32]); + CeedChkBackend(ierr); + } + data->h_array.values[CEED_SCALAR_FP32] = + data->h_array_owned.values[CEED_SCALAR_FP32]; } - // Use owned memory - data->h_array.values[CEED_SCALAR_FP32] = - data->h_array_owned.values[CEED_SCALAR_FP32]; } float *float_data = (float *) data->h_array.values[CEED_SCALAR_FP32]; double *double_data = (double *) data->h_array.values[CEED_SCALAR_FP64]; @@ -172,14 +226,20 @@ static int CeedVectorConvertArrayHost_Hip(CeedVector vec, switch (to_prec) { case CEED_SCALAR_FP64: if (!data->h_array.values[CEED_SCALAR_FP64]) { - if (!data->h_array_owned.values[CEED_SCALAR_FP64]) { - ierr = CeedMalloc(length, - (double **) &data->h_array_owned.values[CEED_SCALAR_FP64]); - CeedChkBackend(ierr); + // Use borrowed memory, if we have it for this precision + if (data->h_array_borrowed.values[CEED_SCALAR_FP64]) { + data->h_array.values[CEED_SCALAR_FP64] = + data->h_array_borrowed.values[CEED_SCALAR_FP64]; + } else { + // Use owned memory + if (!data->h_array_owned.values[CEED_SCALAR_FP64]) { + ierr = CeedMalloc(length, + (double **) &data->h_array_owned.values[CEED_SCALAR_FP64]); + CeedChkBackend(ierr); + } + data->h_array.values[CEED_SCALAR_FP64] = + data->h_array_owned.values[CEED_SCALAR_FP64]; } - // Use owned memory - data->h_array.values[CEED_SCALAR_FP64] = - data->h_array_owned.values[CEED_SCALAR_FP64]; } float *float_data = (float *) data->h_array.values[CEED_SCALAR_FP32]; double *double_data = (double *) data->h_array.values[CEED_SCALAR_FP64]; @@ -230,15 +290,21 @@ static int CeedVectorConvertArrayDevice_Hip(CeedVector vec, break; case CEED_SCALAR_FP32: if (!data->d_array.values[CEED_SCALAR_FP32]) { - if (!data->d_array_owned.values[CEED_SCALAR_FP32]) { - size_t bytes = length * sizeof(float); - ierr = hipMalloc((void **)&data->d_array_owned.values[CEED_SCALAR_FP32], - bytes); - CeedChk_Hip(ceed, ierr); + // Use borrowed memory, if we have it for this precision + if (data->d_array_borrowed.values[CEED_SCALAR_FP32]) { + data->d_array.values[CEED_SCALAR_FP32] = + data->d_array_borrowed.values[CEED_SCALAR_FP32]; + } else { + // Use owned memory + if (!data->d_array_owned.values[CEED_SCALAR_FP32]) { + size_t bytes = length * sizeof(float); + ierr = hipMalloc((void **)&data->d_array_owned.values[CEED_SCALAR_FP32], + bytes); + CeedChk_Hip(ceed, ierr); + } + data->d_array.values[CEED_SCALAR_FP32] = + data->d_array_owned.values[CEED_SCALAR_FP32]; } - // Use owned memory - data->d_array.values[CEED_SCALAR_FP32] = - data->d_array_owned.values[CEED_SCALAR_FP32]; } ierr = CeedDeviceConvertArray_Hip_Fp64_Fp32(length, (double *) data->d_array.values[CEED_SCALAR_FP64], @@ -252,15 +318,21 @@ static int CeedVectorConvertArrayDevice_Hip(CeedVector vec, switch (to_prec) { case CEED_SCALAR_FP64: if (!data->d_array.values[CEED_SCALAR_FP64]) { - if (!data->d_array_owned.values[CEED_SCALAR_FP64]) { - size_t bytes = length * sizeof(double); - ierr = hipMalloc((void **)&data->d_array_owned.values[CEED_SCALAR_FP64], - bytes); - CeedChk_Hip(ceed, ierr); + // Use borrowed memory, if we have it for this precision + if (data->d_array_borrowed.values[CEED_SCALAR_FP64]) { + data->d_array.values[CEED_SCALAR_FP64] = + data->d_array_borrowed.values[CEED_SCALAR_FP64]; + } else { + // Use owned memory + if (!data->d_array_owned.values[CEED_SCALAR_FP64]) { + size_t bytes = length * sizeof(double); + ierr = hipMalloc((void **)&data->d_array_owned.values[CEED_SCALAR_FP64], + bytes); + CeedChk_Hip(ceed, ierr); + } + data->d_array.values[CEED_SCALAR_FP64] = + data->d_array_owned.values[CEED_SCALAR_FP64]; } - // Use owned memory - data->d_array.values[CEED_SCALAR_FP64] = - data->d_array_owned.values[CEED_SCALAR_FP64]; } ierr = CeedDeviceConvertArray_Hip_Fp32_Fp64(length, (float *) data->d_array.values[CEED_SCALAR_FP32], @@ -294,166 +366,177 @@ static int CeedVectorConvertArray_Hip(CeedVector vec, } //------------------------------------------------------------------------------ -// Set all pointers as invalid +// Sync host to device //------------------------------------------------------------------------------ -static inline int CeedVectorSetAllInvalid_Hip(const CeedVector vec) { +static inline int CeedVectorSyncH2D_Hip(const CeedVector vec, + const CeedScalarType prec) { int ierr; + Ceed ceed; + ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - for (int i = 0; i < CEED_NUM_PRECISIONS; i++) { - impl->h_array.values[i] = NULL; - impl->d_array.values[i] = NULL; - } - - return CEED_ERROR_SUCCESS; -} - -//------------------------------------------------------------------------------ -// Return the scalar type of the valid array on mem_type, or the "preferred -// precision" for copying, if more than one precision is valid. If no -// precisions are valid on the specified mem_type, it will return -// CEED_SCALAR_TYPE (default precision); you should check for a valid array -// separately. -//------------------------------------------------------------------------------ -static inline int CeedVectorGetPrecision_Hip(const CeedVector vec, - const CeedMemType mem_type, CeedScalarType *preferred_precision) { + CeedSize length; + ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); + size_t prec_size; + ierr = CeedScalarTypeGetSize_Hip(ceed, prec, &prec_size); + CeedChkBackend(ierr); + size_t bytes = length * prec_size; - int ierr; - CeedVector_Hip *impl; - ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); + if (!impl->h_array.values[prec]) + // LCOV_EXCL_START + return CeedError(ceed, CEED_ERROR_BACKEND, + "No valid host data to sync to device"); + // LCOV_EXCL_STOP - *preferred_precision = CEED_SCALAR_TYPE; - // Check for valid precisions, from most to least precise precise (we want - // the most precision if multiple arrays are valid) - switch (mem_type) { - case CEED_MEM_HOST: - if (!!impl->h_array.values[CEED_SCALAR_FP64]) - *preferred_precision = CEED_SCALAR_FP64; - else if (!!impl->h_array.values[CEED_SCALAR_FP32]) - *preferred_precision = CEED_SCALAR_FP32; - break; - case CEED_MEM_DEVICE: - if (!!impl->d_array.values[CEED_SCALAR_FP64]) - *preferred_precision = CEED_SCALAR_FP64; - else if (!!impl->d_array.values[CEED_SCALAR_FP32]) - *preferred_precision = CEED_SCALAR_FP32; - break; + if (impl->d_array_borrowed.values[prec]) { + impl->d_array.values[prec] = impl->d_array_borrowed.values[prec]; + } else if (impl->d_array_owned.values[prec]) { + impl->d_array.values[prec] = impl->d_array_owned.values[prec]; + } else { + ierr = hipMalloc((void **)&impl->d_array_owned.values[prec], bytes); + CeedChk_Hip(ceed, ierr); + impl->d_array.values[prec] = impl->d_array_owned.values[prec]; } + ierr = hipMemcpy(impl->d_array.values[prec], impl->h_array.values[prec], + bytes, hipMemcpyHostToDevice); CeedChk_Hip(ceed, ierr); + return CEED_ERROR_SUCCESS; } - //------------------------------------------------------------------------------ -// Check if CeedVector has any valid pointers +// Sync device to host //------------------------------------------------------------------------------ -static inline int CeedVectorHasValidArray_Hip(const CeedVector vec, - bool *has_valid_array) { +static inline int CeedVectorSyncD2H_Hip(const CeedVector vec, + const CeedScalarType prec) { int ierr; + Ceed ceed; + ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - *has_valid_array = false; - for (int i = 0; i < CEED_NUM_PRECISIONS; i++) { - *has_valid_array = *has_valid_array || - (!!impl->h_array.values[i] || !!impl->d_array.values[i]); + if (!impl->d_array.values[prec]) + // LCOV_EXCL_START + return CeedError(ceed, CEED_ERROR_BACKEND, + "No valid device data to sync to host"); + // LCOV_EXCL_STOP + + CeedSize length; + ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); + size_t prec_size; + ierr = CeedScalarTypeGetSize_Hip(ceed, prec, &prec_size); + CeedChkBackend(ierr); + size_t bytes = length * prec_size; + + if (impl->h_array_borrowed.values[prec]) { + impl->h_array.values[prec] = impl->h_array_borrowed.values[prec]; + } else if (impl->h_array_owned.values[prec]) { + impl->h_array.values[prec] = impl->h_array_owned.values[prec]; + } else { + CeedSize length; + ierr = CeedVectorGetLength(vec, &length); CeedChkBackend(ierr); + ierr = CeedCallocArray(length, prec_size,&impl->h_array_owned.values[prec]); + CeedChkBackend(ierr); + impl->h_array.values[prec] = impl->h_array_owned.values[prec]; } + ierr = hipMemcpy(impl->h_array.values[prec], impl->d_array.values[prec], + bytes, hipMemcpyDeviceToHost); CeedChk_Hip(ceed, ierr); + return CEED_ERROR_SUCCESS; } //------------------------------------------------------------------------------ -// Check if has valid array of given memory type +// Check if the only current valid array is on another MemType than mem_type //------------------------------------------------------------------------------ -static inline int CeedVectorHasValidArrayOfMemType_Hip(const CeedVector vec, - CeedMemType mem_type, bool *has_valid_array_of_mem_type) { +static inline int CeedVectorNeedSync_Hip(const CeedVector vec, + CeedMemType mem_type, bool *need_sync) { int ierr; CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - *has_valid_array_of_mem_type = false; - switch (mem_type) { - case CEED_MEM_HOST: - for (int i = 0; i < CEED_NUM_PRECISIONS; i++) { - *has_valid_array_of_mem_type = *has_valid_array_of_mem_type || - !!impl->h_array.values[i]; - } - break; - case CEED_MEM_DEVICE: - for (int i = 0; i < CEED_NUM_PRECISIONS; i++) { - *has_valid_array_of_mem_type = *has_valid_array_of_mem_type || - !!impl->d_array.values[i]; - } - break; - } + bool has_valid_array = false; + ierr = CeedVectorHasValidArray(vec, &has_valid_array); CeedChkBackend(ierr); + bool has_valid_array_of_mem_type = false; + ierr = CeedVectorHasValidArrayOfMemType_Hip(vec, mem_type, + &has_valid_array_of_mem_type); + CeedChkBackend(ierr); + + // Check if we have a valid array, but not for the correct memory type + *need_sync = has_valid_array && !has_valid_array_of_mem_type; return CEED_ERROR_SUCCESS; } //------------------------------------------------------------------------------ -// Check if has any array of given type +// Sync arrays between host and device //------------------------------------------------------------------------------ -static inline int CeedVectorHasArrayOfType_Hip(const CeedVector vec, - CeedMemType mem_type, CeedScalarType prec, bool *has_array_of_type) { +static int CeedVectorSyncArrayGeneric_Hip(const CeedVector vec, + CeedMemType mem_type, + CeedScalarType prec) { + int ierr; - CeedVector_Hip *impl; - ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - switch (mem_type) { - case CEED_MEM_HOST: - *has_array_of_type = !!impl->h_array_borrowed.values[prec] || - !!impl->h_array_owned.values[prec]; - break; - case CEED_MEM_DEVICE: - *has_array_of_type = !!impl->d_array_borrowed.values[prec] || - !!impl->d_array_owned.values[prec]; - break; - } + // Check whether device/host sync is needed + bool need_sync = false; + ierr = CeedVectorNeedSync_Hip(vec, mem_type, &need_sync); + CeedChkBackend(ierr); + if (!need_sync) + return CEED_ERROR_SUCCESS; - return CEED_ERROR_SUCCESS; -} + Ceed ceed; + ierr = CeedVectorGetCeed(vec, &ceed); CeedChkBackend(ierr); + CeedMemType source_mem_type = CEED_MEM_HOST; + if (mem_type == CEED_MEM_HOST) source_mem_type = CEED_MEM_DEVICE; + // Sync array to requested mem_type + // Figure out which current precision we have to convert from + CeedScalarType source_cur_prec; + ierr = CeedVectorGetPrecision_Hip(vec, source_mem_type, &source_cur_prec); + CeedChkBackend(ierr); + bool need_convert = false; + CeedScalarType sync_prec = prec; + if (source_cur_prec != prec) { + size_t cur_prec_size, prec_size; + ierr = CeedScalarTypeGetSize_Hip(ceed, source_cur_prec, &cur_prec_size); + CeedChkBackend(ierr); + size_t ierr = CeedScalarTypeGetSize_Hip(ceed, prec, &prec_size); + CeedChkBackend(ierr); -//------------------------------------------------------------------------------ -// Check if has borrowed array of given type -//------------------------------------------------------------------------------ -static inline int CeedVectorHasBorrowedArrayOfType_Hip(const CeedVector vec, - CeedMemType mem_type, CeedScalarType prec, - bool *has_borrowed_array_of_type) { - int ierr; - CeedVector_Hip *impl; - ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); + // If the size of the current precision's data type is greater than + // the destination precision, we want to convert first, then sync, + // to reduce size of memory movement between host and device + if (cur_prec_size > prec_size) { + ierr = CeedVectorConvertArray_Hip(vec, source_mem_type, source_cur_prec, prec); + CeedChkBackend(ierr); + } + // Else, we will sync first, then convert + else { + sync_prec = source_cur_prec; + need_convert = true; + } + } + // Perform sync between host and device in destination precision switch (mem_type) { case CEED_MEM_HOST: - *has_borrowed_array_of_type = !!impl->h_array_borrowed.values[prec]; + ierr = CeedVectorSyncD2H_Hip(vec, sync_prec); CeedChkBackend(ierr); break; case CEED_MEM_DEVICE: - *has_borrowed_array_of_type = !!impl->d_array_borrowed.values[prec]; + ierr = CeedVectorSyncH2D_Hip(vec, sync_prec); CeedChkBackend(ierr); break; + default: + // LCOV_EXCL_START + return CeedError(ceed, CEED_ERROR_BACKEND, + "Invalid memory type specified"); + // LCOV_EXCL_STOP } - return CEED_ERROR_SUCCESS; -} - -//------------------------------------------------------------------------------ -// Check if the only current valid array is on another MemType than mem_type -//------------------------------------------------------------------------------ -static inline int CeedVectorNeedSync_Hip(const CeedVector vec, - CeedMemType mem_type, bool *need_sync) { - int ierr; - CeedVector_Hip *impl; - ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - - bool has_valid_array = false; - ierr = CeedVectorHasValidArray(vec, &has_valid_array); CeedChkBackend(ierr); - bool has_valid_array_of_mem_type = false; - ierr = CeedVectorHasValidArrayOfMemType_Hip(vec, mem_type, - &has_valid_array_of_mem_type); - CeedChkBackend(ierr); - - // Check if we have a valid array, but not for the correct memory type - *need_sync = has_valid_array && !has_valid_array_of_mem_type; + // Perform conversion, if still necessary + if (need_convert) { + ierr = CeedVectorConvertArray_Hip(vec, mem_type, source_cur_prec, prec); + CeedChkBackend(ierr); + } return CEED_ERROR_SUCCESS; } @@ -654,43 +737,18 @@ static int CeedVectorTakeArrayGeneric_Hip(CeedVector vec, CeedMemType mem_type, CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - bool need_sync = false; - ierr = CeedVectorNeedSync_Hip(vec, mem_type, &need_sync); + // Sync host/device (if necessary, otherwise the function will return) + ierr = CeedVectorSyncArrayGeneric_Hip(vec, mem_type, prec); CeedChkBackend(ierr); - if (need_sync) { - CeedMemType source_mem_type = CEED_MEM_HOST; - if (mem_type == CEED_MEM_HOST) source_mem_type = CEED_MEM_DEVICE; - // Sync array to requested mem_type - // Figure out which current precision we have to convert from - CeedScalarType source_cur_prec; - ierr = CeedVectorGetPrecision_Hip(vec, source_mem_type, &source_cur_prec); - CeedChkBackend(ierr); - if (source_cur_prec != prec) { - size_t cur_prec_size, prec_size; - ierr = CeedScalarTypeGetSize_Hip(ceed, source_cur_prec, &cur_prec_size); - CeedChkBackend(ierr); - size_t ierr = CeedScalarTypeGetSize_Hip(ceed, prec, &prec_size); - CeedChkBackend(ierr); - // If the size of the current precision's data type is less than - // the destination precision, we want to sync first and then convert (conversion - // handled outside this sync check). - if (cur_prec_size < prec_size) { - ierr = CeedVectorSync_Hip(vec, mem_type, source_cur_prec); CeedChkBackend(ierr); - CeedChkBackend(ierr); - } else { - ierr = CeedVectorConvertArray_Hip(vec, source_mem_type, source_cur_prec, prec); - ierr = CeedVectorSync_Hip(vec, mem_type, prec); CeedChkBackend(ierr); - } - } else - ierr = CeedVectorSync_Hip(vec, mem_type, prec); CeedChkBackend(ierr); - } // Check if we need to convert from another precision CeedScalarType cur_prec; ierr = CeedVectorGetPrecision_Hip(vec, mem_type, &cur_prec); CeedChkBackend(ierr); - if (cur_prec != prec) + if (cur_prec != prec) { ierr = CeedVectorConvertArray_Hip(vec, mem_type, cur_prec, prec); + CeedChkBackend(ierr); + } // Update pointer switch (mem_type) { @@ -723,43 +781,19 @@ static int CeedVectorGetArrayCore_Hip(const CeedVector vec, CeedVector_Hip *impl; ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); - bool need_sync = false; - ierr = CeedVectorNeedSync_Hip(vec, mem_type, &need_sync); + // Sync host/device (if necessary, otherwise the function will return) + ierr = CeedVectorSyncArrayGeneric_Hip(vec, mem_type, prec); CeedChkBackend(ierr); - if (need_sync) { - CeedMemType source_mem_type = CEED_MEM_HOST; - if (mem_type == CEED_MEM_HOST) source_mem_type = CEED_MEM_DEVICE; - // Sync array to requested mem_type - // Figure out which current precision we have to convert from - CeedScalarType source_cur_prec; - ierr = CeedVectorGetPrecision_Hip(vec, source_mem_type, &source_cur_prec); - CeedChkBackend(ierr); - if (source_cur_prec != prec) { - size_t cur_prec_size, prec_size; - ierr = CeedScalarTypeGetSize_Hip(ceed, source_cur_prec, &cur_prec_size); - CeedChkBackend(ierr); - size_t ierr = CeedScalarTypeGetSize_Hip(ceed, prec, &prec_size); - CeedChkBackend(ierr); - // If the size of the current precision's data type is less than - // the destination precision, we want to sync first and then convert (conversion - // handled outside this sync check). - if (cur_prec_size < prec_size) { - ierr = CeedVectorSync_Hip(vec, mem_type, source_cur_prec); CeedChkBackend(ierr); - CeedChkBackend(ierr); - } else { - ierr = CeedVectorConvertArray_Hip(vec, source_mem_type, source_cur_prec, prec); - ierr = CeedVectorSync_Hip(vec, mem_type, prec); CeedChkBackend(ierr); - } - } else - ierr = CeedVectorSync_Hip(vec, mem_type, prec); CeedChkBackend(ierr); - } // Check if we need to convert from another precision CeedScalarType cur_prec; ierr = CeedVectorGetPrecision_Hip(vec, mem_type, &cur_prec); CeedChkBackend(ierr); - if (cur_prec != prec) + if (cur_prec != prec) { ierr = CeedVectorConvertArray_Hip(vec, mem_type, cur_prec, prec); + CeedChkBackend(ierr); + } + // Update pointer switch (mem_type) { case CEED_MEM_HOST: @@ -1143,6 +1177,8 @@ int CeedVectorCreate_Hip(CeedSize n, CeedVector vec) { CeedVectorTakeArrayGeneric_Hip); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Vector", vec, "SetValue", (int (*)())(CeedVectorSetValue_Hip)); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "SyncArrayGeneric", + CeedVectorSyncArrayGeneric_Hip); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayGeneric", CeedVectorGetArrayGeneric_Hip); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayReadGeneric", diff --git a/interface/ceed.c b/interface/ceed.c index bb46ddcda8..646f26e193 100644 --- a/interface/ceed.c +++ b/interface/ceed.c @@ -842,6 +842,7 @@ int CeedInit(const char *resource, Ceed *ceed) { CEED_FTABLE_ENTRY(CeedVector, SetArrayGeneric), CEED_FTABLE_ENTRY(CeedVector, TakeArrayGeneric), CEED_FTABLE_ENTRY(CeedVector, SetValue), + CEED_FTABLE_ENTRY(CeedVector, SyncArrayGeneric), CEED_FTABLE_ENTRY(CeedVector, GetArrayGeneric), CEED_FTABLE_ENTRY(CeedVector, GetArrayReadGeneric), CEED_FTABLE_ENTRY(CeedVector, GetArrayWriteGeneric), From 88a3338fb59f21732f37b26ed988807d884e07c7 Mon Sep 17 00:00:00 2001 From: nbeams <246972+nbeams@users.noreply.github.com> Date: Wed, 20 Apr 2022 15:37:44 -0600 Subject: [PATCH 04/10] WIP: make style --- backends/cuda-ref/ceed-cuda-vector.c | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/backends/cuda-ref/ceed-cuda-vector.c b/backends/cuda-ref/ceed-cuda-vector.c index 8fbbdec739..c67db91f71 100644 --- a/backends/cuda-ref/ceed-cuda-vector.c +++ b/backends/cuda-ref/ceed-cuda-vector.c @@ -89,8 +89,8 @@ static inline int CeedVectorSyncD2H_Cuda(const CeedVector vec) { // Sync arrays //------------------------------------------------------------------------------ static inline int CeedVectorSync_Cuda(const CeedVector vec, - CeedScalarType prec, - CeedMemType mem_type) { + CeedScalarType prec, + CeedMemType mem_type) { switch (mem_type) { case CEED_MEM_HOST: return CeedVectorSyncD2H_Cuda(vec); case CEED_MEM_DEVICE: return CeedVectorSyncH2D_Cuda(vec); From 3e94c0d61c1d661913bcb4d958cf15df49c61ef6 Mon Sep 17 00:00:00 2001 From: nbeams <246972+nbeams@users.noreply.github.com> Date: Wed, 20 Apr 2022 16:05:08 -0600 Subject: [PATCH 05/10] Add specific FP32/FP64 Vector access functions to interface --- include/ceed/ceed.h | 28 ++++ interface/ceed-vector.c | 292 ++++++++++++++++++++++++++++++++++++++++ 2 files changed, 320 insertions(+) diff --git a/include/ceed/ceed.h b/include/ceed/ceed.h index 217b3204fc..498b51e570 100644 --- a/include/ceed/ceed.h +++ b/include/ceed/ceed.h @@ -357,19 +357,47 @@ CEED_EXTERN int CeedVectorCreate(Ceed ceed, CeedSize len, CeedVector *vec); CEED_EXTERN int CeedVectorReferenceCopy(CeedVector vec, CeedVector *vec_copy); CEED_EXTERN int CeedVectorSetArray(CeedVector vec, CeedMemType mem_type, CeedCopyMode copy_mode, CeedScalar *array); +CEED_EXTERN int CeedVectorSetArrayFP32(CeedVector vec, CeedMemType mem_type, + CeedCopyMode copy_mode, float *array); +CEED_EXTERN int CeedVectorSetArrayFP64(CeedVector vec, CeedMemType mem_type, + CeedCopyMode copy_mode, double *array); CEED_EXTERN int CeedVectorSetValue(CeedVector vec, CeedScalar value); CEED_EXTERN int CeedVectorSyncArray(CeedVector vec, CeedMemType mem_type); +CEED_EXTERN int CeedVectorSyncArrayFP32(CeedVector vec, CeedMemType mem_type); +CEED_EXTERN int CeedVectorSyncArrayFP64(CeedVector vec, CeedMemType mem_type); CEED_EXTERN int CeedVectorTakeArray(CeedVector vec, CeedMemType mem_type, CeedScalar **array); +CEED_EXTERN int CeedVectorTakeArrayFP32(CeedVector vec, CeedMemType mem_type, + float **array); +CEED_EXTERN int CeedVectorTakeArrayFP64(CeedVector vec, CeedMemType mem_type, + double **array); CEED_EXTERN int CeedVectorGetArray(CeedVector vec, CeedMemType mem_type, CeedScalar **array); +CEED_EXTERN int CeedVectorGetArrayFP32(CeedVector vec, CeedMemType mem_type, + float **array); +CEED_EXTERN int CeedVectorGetArrayFP64(CeedVector vec, CeedMemType mem_type, + double **array); CEED_EXTERN int CeedVectorGetArrayRead(CeedVector vec, CeedMemType mem_type, const CeedScalar **array); +CEED_EXTERN int CeedVectorGetArrayReadFP32(CeedVector vec, CeedMemType mem_type, + const float **array); +CEED_EXTERN int CeedVectorGetArrayReadFP64(CeedVector vec, CeedMemType mem_type, + const double **array); CEED_EXTERN int CeedVectorGetArrayWrite(CeedVector vec, CeedMemType mem_type, CeedScalar **array); +CEED_EXTERN int CeedVectorGetArrayWriteFP32(CeedVector vec, CeedMemType mem_type, + float **array); +CEED_EXTERN int CeedVectorGetArrayWriteFP64(CeedVector vec, CeedMemType mem_type, + double **array); CEED_EXTERN int CeedVectorRestoreArray(CeedVector vec, CeedScalar **array); +CEED_EXTERN int CeedVectorRestoreArrayFP32(CeedVector vec, float **array); +CEED_EXTERN int CeedVectorRestoreArrayFP64(CeedVector vec, double **array); CEED_EXTERN int CeedVectorRestoreArrayRead(CeedVector vec, const CeedScalar **array); +CEED_EXTERN int CeedVectorRestoreArrayReadFP32(CeedVector vec, + const float **array); +CEED_EXTERN int CeedVectorRestoreArrayReadFP64(CeedVector vec, + const double **array); CEED_EXTERN int CeedVectorNorm(CeedVector vec, CeedNormType type, CeedScalar *norm); CEED_EXTERN int CeedVectorScale(CeedVector x, CeedScalar alpha); diff --git a/interface/ceed-vector.c b/interface/ceed-vector.c index 8151c54ec0..18a33b2629 100644 --- a/interface/ceed-vector.c +++ b/interface/ceed-vector.c @@ -303,6 +303,46 @@ int CeedVectorSetArray(CeedVector vec, CeedMemType mem_type, (void **) array); } +/** + @brief Version of SetArray for single precision arrays. + + @param vec CeedVector + @param mem_type Memory type of the array being passed + @param copy_mode Copy mode for the array + @param array Array to be used, or NULL with @ref CEED_COPY_VALUES to have the + library allocate + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorSetArrayFP32(CeedVector vec, CeedMemType mem_type, + CeedCopyMode copy_mode, + float *array) { + return CeedVectorSetArrayGeneric(vec, mem_type, CEED_SCALAR_FP32, copy_mode, + (void **) array); +} + +/** + @brief Version of SetArray for double precision arrays. + + @param vec CeedVector + @param mem_type Memory type of the array being passed + @param copy_mode Copy mode for the array + @param array Array to be used, or NULL with @ref CEED_COPY_VALUES to have the + library allocate + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorSetArrayFP64(CeedVector vec, CeedMemType mem_type, + CeedCopyMode copy_mode, + double *array) { + return CeedVectorSetArrayGeneric(vec, mem_type, CEED_SCALAR_FP64, copy_mode, + (void **) array); +} + /** @brief Set the CeedVector to a constant value @@ -393,6 +433,34 @@ int CeedVectorSyncArray(CeedVector vec, CeedMemType mem_type) { return CeedVectorSyncArrayGeneric(vec, mem_type, CEED_SCALAR_TYPE); } +/** + @brief Sync the CeedVector to a specified memtype for single precision. + + @param vec CeedVector + @param mem_type Memtype to be synced + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorSyncArrayFP32(CeedVector vec, CeedMemType mem_type) { + return CeedVectorSyncArrayGeneric(vec, mem_type, CEED_SCALAR_FP32); +} + +/** + @brief Sync the CeedVector to a specified memtype for double precision. + + @param vec CeedVector + @param mem_type Memtype to be synced + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorSyncArrayFP64(CeedVector vec, CeedMemType mem_type) { + return CeedVectorSyncArrayGeneric(vec, mem_type, CEED_SCALAR_FP64); +} + /** @brief Take ownership of the specified precision array set by @ref CeedVectorSetArray() with @ref CEED_USE_POINTER and remove the array from the CeedVector. @@ -479,6 +547,50 @@ int CeedVectorTakeArray(CeedVector vec, CeedMemType mem_type, (void **) array); } +/** + @brief Take ownership of the CeedVector single precision array set by + @ref CeedVectorSetArrayFP32() with @ref CEED_USE_POINTER, and + remove the array from the CeedVector. + The caller is responsible for managing and freeing the array. + + @param vec CeedVector + @param mem_type Memory type on which to take the array. If the backend + uses a different memory type, this will perform a copy. + @param[out] array Array on memory type mem_type, or NULL if array pointer is + not required + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorTakeArrayFP32(CeedVector vec, CeedMemType mem_type, + float **array) { + return CeedVectorTakeArrayGeneric(vec, mem_type, CEED_SCALAR_FP32, + (void **) array); +} + +/** + @brief Take ownership of the CeedVector double precision array set by + @ref CeedVectorSetArrayFP64() with @ref CEED_USE_POINTER, and + remove the array from the CeedVector. + The caller is responsible for managing and freeing the array. + + @param vec CeedVector + @param mem_type Memory type on which to take the array. If the backend + uses a different memory type, this will perform a copy. + @param[out] array Array on memory type mem_type, or NULL if array pointer is + not required + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorTakeArrayFP64(CeedVector vec, CeedMemType mem_type, + double **array) { + return CeedVectorTakeArrayGeneric(vec, mem_type, CEED_SCALAR_FP64, + (void **) array); +} + /** @brief Get read/write access to a CeedVector via the specified memory type and scalar precision. @@ -560,6 +672,46 @@ int CeedVectorGetArray(CeedVector vec, CeedMemType mem_type, (void **) array); } +/** + @brief Get single precision read/write access to a CeedVector via the + specified memory type. + Restore access with @ref CeedVectorRestoreArrayFP32(). + + @param vec CeedVector to access + @param mem_type Memory type on which to access the array. If the backend + uses a different memory type, this will perform a copy. + @param[out] array Array on memory type mem_type + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorGetArrayFP32(CeedVector vec, CeedMemType mem_type, + float **array) { + return CeedVectorGetArrayGeneric(vec, mem_type, CEED_SCALAR_FP32, + (void **) array); +} + +/** + @brief Get double precision read/write access to a CeedVector via the + specified memory type. + Restore access with @ref CeedVectorRestoreArrayFP64(). + + @param vec CeedVector to access + @param mem_type Memory type on which to access the array. If the backend + uses a different memory type, this will perform a copy. + @param[out] array Array on memory type mem_type + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorGetArrayFP64(CeedVector vec, CeedMemType mem_type, + double **array) { + return CeedVectorGetArrayGeneric(vec, mem_type, CEED_SCALAR_FP64, + (void **) array); +} + /** @brief Get read-only access to a CeedVector via the specified memory type and precision. @@ -630,6 +782,48 @@ int CeedVectorGetArrayRead(CeedVector vec, CeedMemType mem_type, (const void **) array); } +/** + @brief Get read-only single precision access to a CeedVector via the + specified memory type. + Restore access with @ref CeedVectorRestoreArrayReadFP32(). + + @param vec CeedVector to access + @param mem_type Memory type on which to access the array. If the backend + uses a different memory type, this will perform a copy + (possibly cached). + @param[out] array Array on memory type mem_type + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorGetArrayReadFP32(CeedVector vec, CeedMemType mem_type, + const float **array) { + return CeedVectorGetArrayReadGeneric(vec, mem_type, CEED_SCALAR_FP32, + (const void **) array); +} + +/** + @brief Get read-only double precision access to a CeedVector via the + specified memory type. + Restore access with @ref CeedVectorRestoreArrayReadFP64(). + + @param vec CeedVector to access + @param mem_type Memory type on which to access the array. If the backend + uses a different memory type, this will perform a copy + (possibly cached). + @param[out] array Array on memory type mem_type + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorGetArrayReadFP64(CeedVector vec, CeedMemType mem_type, + const double **array) { + return CeedVectorGetArrayReadGeneric(vec, mem_type, CEED_SCALAR_FP64, + (const void **) array); +} + /** @brief Get write access to a CeedVector via the specified memory type and precision. @@ -695,6 +889,46 @@ int CeedVectorGetArrayWrite(CeedVector vec, CeedMemType mem_type, (void **) array); } +/** + @brief Get single precision write access to a CeedVector via the specified + memory type. + Restore access with @ref CeedVectorRestoreArrayFP32(). All old + values should be assumed to be invalid. + + @param vec CeedVector to access + @param mem_type Memory type on which to access the array. + @param[out] array Array on memory type mem_type + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorGetArrayWriteFP32(CeedVector vec, CeedMemType mem_type, + float **array) { + return CeedVectorGetArrayWriteGeneric(vec, mem_type, CEED_SCALAR_FP32, + (void **) array); +} + +/** + @brief Get double precision write access to a CeedVector via the specified + memory type. + Restore access with @ref CeedVectorRestoreArrayFP64(). All old + values should be assumed to be invalid. + + @param vec CeedVector to access + @param mem_type Memory type on which to access the array. + @param[out] array Array on memory type mem_type + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorGetArrayWriteFP64(CeedVector vec, CeedMemType mem_type, + double **array) { + return CeedVectorGetArrayWriteGeneric(vec, mem_type, CEED_SCALAR_FP64, + (void **) array); +} + /** @brief Restore an array obtained using @ref CeedVectorGetArrayGeneric() or @ref CeedVectorGetArrayWriteGeneric() @@ -736,6 +970,36 @@ int CeedVectorRestoreArray(CeedVector vec, CeedScalar **array) { return CeedVectorRestoreArrayGeneric(vec, (void **) array); } +/** + @brief Restore an array obtained using @ref CeedVectorGetArrayFP32() + or @ref CeedVectorGetArrayWriteFP32() + + @param vec CeedVector to restore + @param array Array of vector data + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorRestoreArrayFP32(CeedVector vec, float **array) { + return CeedVectorRestoreArrayGeneric(vec, (void **) array); +} + +/** + @brief Restore an array obtained using @ref CeedVectorGetArrayFP64() + or @ref CeedVectorGetArrayWriteFP64() + + @param vec CeedVector to restore + @param array Array of vector data + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorRestoreArrayFP64(CeedVector vec, double **array) { + return CeedVectorRestoreArrayGeneric(vec, (void **) array); +} + /** @brief Restore an array obtained using @ref CeedVectorGetArrayReadGeneric() @@ -778,6 +1042,34 @@ int CeedVectorRestoreArrayRead(CeedVector vec, const CeedScalar **array) { return CeedVectorRestoreArrayReadGeneric(vec, (const void **) array); } +/** + @brief Restore an array obtained using @ref CeedVectorGetArrayReadFP32() + + @param vec CeedVector to restore + @param array Array of vector data + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorRestoreArrayReadFP32(CeedVector vec, const float **array) { + return CeedVectorRestoreArrayReadGeneric(vec, (const void **) array); +} + +/** + @brief Restore an array obtained using @ref CeedVectorGetArrayReadFP64() + + @param vec CeedVector to restore + @param array Array of vector data + + @return An error code: 0 - success, otherwise - failure + + @ref User +**/ +int CeedVectorRestoreArrayReadFP64(CeedVector vec, const double **array) { + return CeedVectorRestoreArrayReadGeneric(vec, (const void **) array); +} + /** @brief Get the norm of a CeedVector. From fd75fdf7cc4919c94f2cfa77e54d2cdeae8b776f Mon Sep 17 00:00:00 2001 From: nbeams <246972+nbeams@users.noreply.github.com> Date: Fri, 22 Apr 2022 14:05:51 -0600 Subject: [PATCH 06/10] WIP, experimental: add user-level function for checking array status for different precisions --- backends/hip-ref/ceed-hip-ref-vector.c | 43 ++++++++++++++++++++++++++ include/ceed-impl.h | 2 ++ include/ceed/ceed.h | 3 ++ interface/ceed-vector.c | 33 ++++++++++++++++++++ interface/ceed.c | 1 + 5 files changed, 82 insertions(+) diff --git a/backends/hip-ref/ceed-hip-ref-vector.c b/backends/hip-ref/ceed-hip-ref-vector.c index 7e07b7d8db..68b9e8a617 100644 --- a/backends/hip-ref/ceed-hip-ref-vector.c +++ b/backends/hip-ref/ceed-hip-ref-vector.c @@ -35,6 +35,47 @@ static inline int CeedScalarTypeGetSize_Hip(Ceed ceed, CeedScalarType prec, return CEED_ERROR_SUCCESS; } +//------------------------------------------------------------------------------ +// Get info about the current status of the different precisions in the +// valid, borrowed, and owned arrays, for a specific mem_type +//------------------------------------------------------------------------------ +static int CeedVectorCheckArrayStatus_Hip(CeedVector vec, + CeedMemType mem_type, + unsigned int *valid_status, + unsigned int *borrowed_status, + unsigned int *owned_status) { + + int ierr; + CeedVector_Hip *impl; + ierr = CeedVectorGetData(vec, &impl); CeedChkBackend(ierr); + *valid_status = 0; + *borrowed_status = 0; + *owned_status = 0; + switch(mem_type) { + case CEED_MEM_HOST: + for (int i = 0; i < CEED_NUM_PRECISIONS; i++) { + if (!!impl->h_array.values[i]) + *valid_status += 1 << i; + if (!!impl->h_array_borrowed.values[i]) + *borrowed_status += 1 << i; + if (!!impl->h_array_owned.values[i]) + *owned_status += 1 << i; + } + break; + case CEED_MEM_DEVICE: + for (int i = 0; i < CEED_NUM_PRECISIONS; i++) { + if (!!impl->d_array.values[i]) + *valid_status += 1 << i; + if (!!impl->d_array_borrowed.values[i]) + *borrowed_status += 1 << i; + if (!!impl->d_array_owned.values[i]) + *owned_status += 1 << i; + } + break; + } + return CEED_ERROR_SUCCESS; +} + //------------------------------------------------------------------------------ // Set all pointers as invalid //------------------------------------------------------------------------------ @@ -1171,6 +1212,8 @@ int CeedVectorCreate_Hip(CeedSize n, CeedVector vec) { ierr = CeedSetBackendFunction(ceed, "Vector", vec, "HasBorrowedArrayOfType", CeedVectorHasBorrowedArrayOfType_Hip); CeedChkBackend(ierr); + ierr = CeedSetBackendFunction(ceed, "Vector", vec, "CheckArrayStatus", + CeedVectorCheckArrayStatus_Hip); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Vector", vec, "SetArrayGeneric", CeedVectorSetArrayGeneric_Hip); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Vector", vec, "TakeArrayGeneric", diff --git a/include/ceed-impl.h b/include/ceed-impl.h index be1445adde..993d3088e8 100644 --- a/include/ceed-impl.h +++ b/include/ceed-impl.h @@ -129,6 +129,8 @@ struct CeedVector_private { Ceed ceed; int (*HasValidArray)(CeedVector, bool *); int (*HasBorrowedArrayOfType)(CeedVector, CeedMemType, CeedScalarType, bool *); + int (*CheckArrayStatus)(CeedVector, CeedMemType, unsigned int *, unsigned int *, + unsigned int *); int (*SetArrayGeneric)(CeedVector, CeedMemType, CeedScalarType, CeedCopyMode, void *); int (*SetValue)(CeedVector, CeedScalar); diff --git a/include/ceed/ceed.h b/include/ceed/ceed.h index 498b51e570..3a8268dcd1 100644 --- a/include/ceed/ceed.h +++ b/include/ceed/ceed.h @@ -398,6 +398,9 @@ CEED_EXTERN int CeedVectorRestoreArrayReadFP32(CeedVector vec, const float **array); CEED_EXTERN int CeedVectorRestoreArrayReadFP64(CeedVector vec, const double **array); +CEED_EXTERN int CeedVectorCheckArrayStatus(CeedVector vec, CeedMemType mem_type, + unsigned int *valid_status, unsigned int *borrowed_status, + unsigned int *owned_status); CEED_EXTERN int CeedVectorNorm(CeedVector vec, CeedNormType type, CeedScalar *norm); CEED_EXTERN int CeedVectorScale(CeedVector x, CeedScalar alpha); diff --git a/interface/ceed-vector.c b/interface/ceed-vector.c index 18a33b2629..2896fe97ef 100644 --- a/interface/ceed-vector.c +++ b/interface/ceed-vector.c @@ -1070,6 +1070,39 @@ int CeedVectorRestoreArrayReadFP64(CeedVector vec, const double **array) { return CeedVectorRestoreArrayReadGeneric(vec, (const void **) array); } +/** + @brief Check the current status of the CeedVector's data arrays. + + This function sets unsigned int parameters indicating for which precisions + the data for mem_type is not NULL, for borrowed and owned arrays, and also + which precisions are currently valid. + The values can be checked bitwise, such that, e.g., + (valid_status & (1 << CEED_SCALAR_FP32)) will be true if the FP32 array is + currently valid, and false otherwise. + + @param vec CeedVector for which to check status + @param mem_type Mem type for which to check status + @param valid_status Status indicator for valid data + @param borrowed_status Status indicator for borrowed arrays + @param owned_status Status indicator for owned arrays +**/ +int CeedVectorCheckArrayStatus(CeedVector vec, CeedMemType mem_type, + unsigned int *valid_status, + unsigned int *borrowed_status, + unsigned int *owned_status) { + int ierr; + + if (!vec->CheckArrayStatus) + // LCOV_EXCL_START + return CeedError(vec->ceed, CEED_ERROR_UNSUPPORTED, + "Backend does not support CheckArrayStatus"); + // LCOV_EXCL_STOP + + ierr = vec->CheckArrayStatus(vec, mem_type, valid_status, borrowed_status, + owned_status); CeedChk(ierr); + return CEED_ERROR_SUCCESS; +} + /** @brief Get the norm of a CeedVector. diff --git a/interface/ceed.c b/interface/ceed.c index 646f26e193..f4869fed8e 100644 --- a/interface/ceed.c +++ b/interface/ceed.c @@ -848,6 +848,7 @@ int CeedInit(const char *resource, Ceed *ceed) { CEED_FTABLE_ENTRY(CeedVector, GetArrayWriteGeneric), CEED_FTABLE_ENTRY(CeedVector, RestoreArrayGeneric), CEED_FTABLE_ENTRY(CeedVector, RestoreArrayReadGeneric), + CEED_FTABLE_ENTRY(CeedVector, CheckArrayStatus), CEED_FTABLE_ENTRY(CeedVector, Norm), CEED_FTABLE_ENTRY(CeedVector, Scale), CEED_FTABLE_ENTRY(CeedVector, AXPY), From 80606a95a4eeebc1d18547a1d3a86f3777f9a542 Mon Sep 17 00:00:00 2001 From: nbeams <246972+nbeams@users.noreply.github.com> Date: Tue, 26 Apr 2022 17:30:41 -0600 Subject: [PATCH 07/10] WIP: use Generic vector access functions and void pointers in other backend functions --- backends/hip-ref/ceed-hip-ref-basis.c | 32 ++++-- backends/hip-ref/ceed-hip-ref-operator.c | 118 ++++++++++++-------- backends/hip-ref/ceed-hip-ref-qfunction.c | 10 +- backends/hip-ref/ceed-hip-ref-restriction.c | 19 ++-- backends/hip-ref/ceed-hip-ref.h | 4 +- 5 files changed, 113 insertions(+), 70 deletions(-) diff --git a/backends/hip-ref/ceed-hip-ref-basis.c b/backends/hip-ref/ceed-hip-ref-basis.c index 16a509b81d..6e0b3de402 100644 --- a/backends/hip-ref/ceed-hip-ref-basis.c +++ b/backends/hip-ref/ceed-hip-ref-basis.c @@ -29,12 +29,16 @@ int CeedBasisApply_Hip(CeedBasis basis, const CeedInt num_elem, const int max_block_size = 64; // Read vectors - const CeedScalar *d_u; - CeedScalar *d_v; + const void *d_u; + void *d_v; if (eval_mode != CEED_EVAL_WEIGHT) { - ierr = CeedVectorGetArrayRead(u, CEED_MEM_DEVICE, &d_u); CeedChkBackend(ierr); + ierr = CeedVectorGetArrayReadGeneric(u, CEED_MEM_DEVICE, CEED_SCALAR_TYPE, + &d_u); + CeedChkBackend(ierr); } - ierr = CeedVectorGetArrayWrite(v, CEED_MEM_DEVICE, &d_v); CeedChkBackend(ierr); + ierr = CeedVectorGetArrayWriteGeneric(v, CEED_MEM_DEVICE, CEED_SCALAR_TYPE, + &d_v); + CeedChkBackend(ierr); // Clear v for transpose operation if (t_mode == CEED_TRANSPOSE) { @@ -93,9 +97,9 @@ int CeedBasisApply_Hip(CeedBasis basis, const CeedInt num_elem, // Restore vectors if (eval_mode != CEED_EVAL_WEIGHT) { - ierr = CeedVectorRestoreArrayRead(u, &d_u); CeedChkBackend(ierr); + ierr = CeedVectorRestoreArrayReadGeneric(u, &d_u); CeedChkBackend(ierr); } - ierr = CeedVectorRestoreArray(v, &d_v); CeedChkBackend(ierr); + ierr = CeedVectorRestoreArrayGeneric(v, &d_v); CeedChkBackend(ierr); return CEED_ERROR_SUCCESS; } @@ -121,12 +125,16 @@ int CeedBasisApplyNonTensor_Hip(CeedBasis basis, const CeedInt num_elem, num_elem/elemsPerBlock*elemsPerBlockevecs[i]) { // No restriction for this field; read data directly from vec. - ierr = CeedVectorGetArrayRead(vec, CEED_MEM_DEVICE, - (const CeedScalar **) &edata[i]); + ierr = CeedVectorGetArrayReadGeneric(vec, CEED_MEM_DEVICE, + CEED_SCALAR_TYPE, (const void **) &edata[i]); CeedChkBackend(ierr); } else { ierr = CeedElemRestrictionApply(Erestrict, CEED_NOTRANSPOSE, vec, impl->evecs[i], request); CeedChkBackend(ierr); // Get evec - ierr = CeedVectorGetArrayRead(impl->evecs[i], CEED_MEM_DEVICE, - (const CeedScalar **) &edata[i]); + ierr = CeedVectorGetArrayReadGeneric(impl->evecs[i], CEED_MEM_DEVICE, + CEED_SCALAR_TYPE, (const void **) &edata[i]); CeedChkBackend(ierr); } } @@ -299,7 +299,7 @@ static inline int CeedOperatorSetupInputs_Hip(CeedInt numinputfields, static inline int CeedOperatorInputBasis_Hip(CeedInt numelements, CeedQFunctionField *qfinputfields, CeedOperatorField *opinputfields, CeedInt numinputfields, const bool skipactive, - CeedScalar *edata[2*CEED_FIELD_MAX], CeedOperator_Hip *impl) { + void *edata[2*CEED_FIELD_MAX], CeedOperator_Hip *impl) { CeedInt ierr; CeedInt elemsize, size; CeedElemRestriction Erestrict; @@ -325,8 +325,9 @@ static inline int CeedOperatorInputBasis_Hip(CeedInt numelements, // Basis action switch (emode) { case CEED_EVAL_NONE: - ierr = CeedVectorSetArray(impl->qvecsin[i], CEED_MEM_DEVICE, - CEED_USE_POINTER, edata[i]); CeedChkBackend(ierr); + ierr = CeedVectorSetArrayGeneric(impl->qvecsin[i], CEED_MEM_DEVICE, + CEED_SCALAR_TYPE, CEED_USE_POINTER, edata[i]); + CeedChkBackend(ierr); break; case CEED_EVAL_INTERP: ierr = CeedOperatorFieldGetBasis(opinputfields[i], &basis); @@ -358,7 +359,7 @@ static inline int CeedOperatorInputBasis_Hip(CeedInt numelements, //------------------------------------------------------------------------------ static inline int CeedOperatorRestoreInputs_Hip(CeedInt numinputfields, CeedQFunctionField *qfinputfields, CeedOperatorField *opinputfields, - const bool skipactive, CeedScalar *edata[2*CEED_FIELD_MAX], + const bool skipactive, void *edata[2*CEED_FIELD_MAX], CeedOperator_Hip *impl) { CeedInt ierr; CeedEvalMode emode; @@ -377,12 +378,12 @@ static inline int CeedOperatorRestoreInputs_Hip(CeedInt numinputfields, } else { if (!impl->evecs[i]) { // This was a skiprestrict case ierr = CeedOperatorFieldGetVector(opinputfields[i], &vec); CeedChkBackend(ierr); - ierr = CeedVectorRestoreArrayRead(vec, - (const CeedScalar **)&edata[i]); + ierr = CeedVectorRestoreArrayReadGeneric(vec, + (const void **)&edata[i]); CeedChkBackend(ierr); } else { - ierr = CeedVectorRestoreArrayRead(impl->evecs[i], - (const CeedScalar **) &edata[i]); + ierr = CeedVectorRestoreArrayReadGeneric(impl->evecs[i], + (const void **) &edata[i]); CeedChkBackend(ierr); } } @@ -414,7 +415,7 @@ static int CeedOperatorApplyAdd_Hip(CeedOperator op, CeedVector invec, CeedVector vec; CeedBasis basis; CeedElemRestriction Erestrict; - CeedScalar *edata[2*CEED_FIELD_MAX]; + void *edata[2*CEED_FIELD_MAX]; // Setup ierr = CeedOperatorSetup_Hip(op); CeedChkBackend(ierr); @@ -435,10 +436,13 @@ static int CeedOperatorApplyAdd_Hip(CeedOperator op, CeedVector invec, CeedChkBackend(ierr); if (emode == CEED_EVAL_NONE) { // Set the output Q-Vector to use the E-Vector data directly. - ierr = CeedVectorGetArrayWrite(impl->evecs[i + impl->numein], CEED_MEM_DEVICE, - &edata[i + numinputfields]); CeedChkBackend(ierr); - ierr = CeedVectorSetArray(impl->qvecsout[i], CEED_MEM_DEVICE, - CEED_USE_POINTER, edata[i + numinputfields]); + ierr = CeedVectorGetArrayWriteGeneric(impl->evecs[i + impl->numein], + CEED_MEM_DEVICE, + CEED_SCALAR_TYPE, &edata[i + numinputfields]); + CeedChkBackend(ierr); + ierr = CeedVectorSetArrayGeneric(impl->qvecsout[i], CEED_MEM_DEVICE, + CEED_SCALAR_TYPE, CEED_USE_POINTER, + edata[i + numinputfields]); CeedChkBackend(ierr); } } @@ -498,8 +502,8 @@ static int CeedOperatorApplyAdd_Hip(CeedOperator op, CeedVector invec, ierr = CeedQFunctionFieldGetEvalMode(qfoutputfields[i], &emode); CeedChkBackend(ierr); if (emode == CEED_EVAL_NONE) { - ierr = CeedVectorRestoreArray(impl->evecs[i+impl->numein], - &edata[i + numinputfields]); + ierr = CeedVectorRestoreArrayGeneric(impl->evecs[i+impl->numein], + &edata[i + numinputfields]); CeedChkBackend(ierr); } // Get output vector @@ -549,13 +553,17 @@ static inline int CeedOperatorLinearAssembleQFunctionCore_Hip(CeedOperator op, CeedVector vec; CeedInt numactivein = impl->qfnumactivein, numactiveout = impl->qfnumactiveout; CeedVector *activein = impl->qfactivein; - CeedScalar *a, *tmp; + void *a, *tmp; + size_t prec_size = sizeof(double); + if (CEED_SCALAR_TYPE == CEED_SCALAR_FP32) { + prec_size = sizeof(float); + } Ceed ceed, ceedparent; ierr = CeedOperatorGetCeed(op, &ceed); CeedChkBackend(ierr); ierr = CeedGetOperatorFallbackParentCeed(ceed, &ceedparent); CeedChkBackend(ierr); ceedparent = ceedparent ? ceedparent : ceed; - CeedScalar *edata[2*CEED_FIELD_MAX]; + void *edata[2*CEED_FIELD_MAX]; // Setup ierr = CeedOperatorSetup_Hip(op); CeedChkBackend(ierr); @@ -582,20 +590,24 @@ static inline int CeedOperatorLinearAssembleQFunctionCore_Hip(CeedOperator op, // Check if active input if (vec == CEED_VECTOR_ACTIVE) { ierr = CeedQFunctionFieldGetSize(qfinputfields[i], &size); CeedChkBackend(ierr); + //todo: generic version of SetValue? ierr = CeedVectorSetValue(impl->qvecsin[i], 0.0); CeedChkBackend(ierr); - ierr = CeedVectorGetArray(impl->qvecsin[i], CEED_MEM_DEVICE, &tmp); + ierr = CeedVectorGetArrayGeneric(impl->qvecsin[i], CEED_MEM_DEVICE, + CEED_SCALAR_TYPE, &tmp); CeedChkBackend(ierr); ierr = CeedRealloc(numactivein + size, &activein); CeedChkBackend(ierr); for (CeedInt field = 0; field < size; field++) { q_size = (CeedSize)Q*numelements; ierr = CeedVectorCreate(ceed, q_size, &activein[numactivein+field]); CeedChkBackend(ierr); - ierr = CeedVectorSetArray(activein[numactivein+field], CEED_MEM_DEVICE, - CEED_USE_POINTER, &tmp[field*Q*numelements]); + ierr = CeedVectorSetArrayGeneric(activein[numactivein+field], CEED_MEM_DEVICE, + CEED_SCALAR_TYPE, CEED_USE_POINTER, + (void *) ((char *)(tmp) + prec_size*field*Q*numelements)); CeedChkBackend(ierr); } numactivein += size; - ierr = CeedVectorRestoreArray(impl->qvecsin[i], &tmp); CeedChkBackend(ierr); + ierr = CeedVectorRestoreArrayGeneric(impl->qvecsin[i], &tmp); + CeedChkBackend(ierr); } } impl->qfnumactivein = numactivein; @@ -638,8 +650,10 @@ static inline int CeedOperatorLinearAssembleQFunctionCore_Hip(CeedOperator op, CeedSize l_size = (CeedSize)numelements*Q*numactivein*numactiveout; ierr = CeedVectorCreate(ceedparent, l_size, assembled); CeedChkBackend(ierr); } + // todo: generic SetValue? ierr = CeedVectorSetValue(*assembled, 0.0); CeedChkBackend(ierr); - ierr = CeedVectorGetArray(*assembled, CEED_MEM_DEVICE, &a); + ierr = CeedVectorGetArrayGeneric(*assembled, CEED_MEM_DEVICE, CEED_SCALAR_TYPE, + &a); CeedChkBackend(ierr); // Input basis apply @@ -662,11 +676,12 @@ static inline int CeedOperatorLinearAssembleQFunctionCore_Hip(CeedOperator op, CeedChkBackend(ierr); // Check if active output if (vec == CEED_VECTOR_ACTIVE) { - CeedVectorSetArray(impl->qvecsout[out], CEED_MEM_DEVICE, - CEED_USE_POINTER, a); CeedChkBackend(ierr); + CeedVectorSetArrayGeneric(impl->qvecsout[out], CEED_MEM_DEVICE, + CEED_SCALAR_TYPE, CEED_USE_POINTER, a); CeedChkBackend(ierr); ierr = CeedQFunctionFieldGetSize(qfoutputfields[out], &size); CeedChkBackend(ierr); - a += size*Q*numelements; // Advance the pointer by the size of the output + a = (void *) ((char *)(a) + + prec_size*size*Q*numelements); // Advance the pointer by the size of the output } } // Apply QFunction @@ -681,7 +696,8 @@ static inline int CeedOperatorLinearAssembleQFunctionCore_Hip(CeedOperator op, CeedChkBackend(ierr); // Check if active output if (vec == CEED_VECTOR_ACTIVE) { - ierr = CeedVectorTakeArray(impl->qvecsout[out], CEED_MEM_DEVICE, NULL); + ierr = CeedVectorTakeArrayGeneric(impl->qvecsout[out], CEED_MEM_DEVICE, + CEED_SCALAR_TYPE, NULL); CeedChkBackend(ierr); } } @@ -692,7 +708,7 @@ static inline int CeedOperatorLinearAssembleQFunctionCore_Hip(CeedOperator op, CeedChkBackend(ierr); // Restore output - ierr = CeedVectorRestoreArray(*assembled, &a); CeedChkBackend(ierr); + ierr = CeedVectorRestoreArrayGeneric(*assembled, &a); CeedChkBackend(ierr); return CEED_ERROR_SUCCESS; } @@ -1150,11 +1166,14 @@ static inline int CeedOperatorAssembleDiagonalCore_Hip(CeedOperator op, ierr = CeedVectorSetValue(elemdiag, 0.0); CeedChkBackend(ierr); // Assemble element operator diagonals - CeedScalar *elemdiagarray; - const CeedScalar *assembledqfarray; - ierr = CeedVectorGetArray(elemdiag, CEED_MEM_DEVICE, &elemdiagarray); + void *elemdiagarray; + const void *assembledqfarray; + ierr = CeedVectorGetArrayGeneric(elemdiag, CEED_MEM_DEVICE, CEED_SCALAR_TYPE, + &elemdiagarray); CeedChkBackend(ierr); - ierr = CeedVectorGetArrayRead(assembledqf, CEED_MEM_DEVICE, &assembledqfarray); + ierr = CeedVectorGetArrayReadGeneric(assembledqf, CEED_MEM_DEVICE, + CEED_SCALAR_TYPE, + &assembledqfarray); CeedChkBackend(ierr); CeedInt nelem; ierr = CeedElemRestrictionGetNumElements(diagrstr, &nelem); @@ -1179,8 +1198,9 @@ static inline int CeedOperatorAssembleDiagonalCore_Hip(CeedOperator op, } // Restore arrays - ierr = CeedVectorRestoreArray(elemdiag, &elemdiagarray); CeedChkBackend(ierr); - ierr = CeedVectorRestoreArrayRead(assembledqf, &assembledqfarray); + ierr = CeedVectorRestoreArrayGeneric(elemdiag, &elemdiagarray); + CeedChkBackend(ierr); + ierr = CeedVectorRestoreArrayReadGeneric(assembledqf, &assembledqfarray); CeedChkBackend(ierr); // Assemble local operator diagonal @@ -1587,12 +1607,19 @@ static int CeedSingleOperatorAssemble_Hip(CeedOperator op, CeedInt offset, ierr = CeedOperatorLinearAssembleQFunctionBuildOrUpdate( op, &assembled_qf, &rstr_q, CEED_REQUEST_IMMEDIATE); CeedChkBackend(ierr); ierr = CeedElemRestrictionDestroy(&rstr_q); CeedChkBackend(ierr); - CeedScalar *values_array; - ierr = CeedVectorGetArrayWrite(values, CEED_MEM_DEVICE, &values_array); + void *values_array; + ierr = CeedVectorGetArrayWriteGeneric(values, CEED_MEM_DEVICE, CEED_SCALAR_TYPE, + &values_array); CeedChkBackend(ierr); - values_array += offset; - const CeedScalar *qf_array; - ierr = CeedVectorGetArrayRead(assembled_qf, CEED_MEM_DEVICE, &qf_array); + size_t prec_size = sizeof(double); + if (CEED_SCALAR_TYPE == CEED_SCALAR_FP32) { + prec_size = sizeof(float); + } + values_array = (void *)((char *)(values_array) + prec_size*offset); + const void *qf_array; + ierr = CeedVectorGetArrayReadGeneric(assembled_qf, CEED_MEM_DEVICE, + CEED_SCALAR_TYPE, + &qf_array); CeedChkBackend(ierr); // Compute B^T D B @@ -1610,8 +1637,9 @@ static int CeedSingleOperatorAssemble_Hip(CeedOperator op, CeedInt offset, // Restore arrays - ierr = CeedVectorRestoreArray(values, &values_array); CeedChkBackend(ierr); - ierr = CeedVectorRestoreArrayRead(assembled_qf, &qf_array); + ierr = CeedVectorRestoreArrayGeneric(values, &values_array); + CeedChkBackend(ierr); + ierr = CeedVectorRestoreArrayReadGeneric(assembled_qf, &qf_array); CeedChkBackend(ierr); // Cleanup diff --git a/backends/hip-ref/ceed-hip-ref-qfunction.c b/backends/hip-ref/ceed-hip-ref-qfunction.c index ddebbf3785..d8fe4eb902 100644 --- a/backends/hip-ref/ceed-hip-ref-qfunction.c +++ b/backends/hip-ref/ceed-hip-ref-qfunction.c @@ -37,11 +37,13 @@ static int CeedQFunctionApply_Hip(CeedQFunction qf, CeedInt Q, // Read vectors for (CeedInt i = 0; i < num_input_fields; i++) { - ierr = CeedVectorGetArrayRead(U[i], CEED_MEM_DEVICE, &data->fields.inputs[i]); + ierr = CeedVectorGetArrayReadGeneric(U[i], CEED_MEM_DEVICE, CEED_SCALAR_TYPE, + &data->fields.inputs[i]); CeedChkBackend(ierr); } for (CeedInt i = 0; i < num_output_fields; i++) { - ierr = CeedVectorGetArrayWrite(V[i], CEED_MEM_DEVICE, &data->fields.outputs[i]); + ierr = CeedVectorGetArrayWriteGeneric(V[i], CEED_MEM_DEVICE, CEED_SCALAR_TYPE, + &data->fields.outputs[i]); CeedChkBackend(ierr); } @@ -56,11 +58,11 @@ static int CeedQFunctionApply_Hip(CeedQFunction qf, CeedInt Q, // Restore vectors for (CeedInt i = 0; i < num_input_fields; i++) { - ierr = CeedVectorRestoreArrayRead(U[i], &data->fields.inputs[i]); + ierr = CeedVectorRestoreArrayReadGeneric(U[i], &data->fields.inputs[i]); CeedChkBackend(ierr); } for (CeedInt i = 0; i < num_output_fields; i++) { - ierr = CeedVectorRestoreArray(V[i], &data->fields.outputs[i]); + ierr = CeedVectorRestoreArrayGeneric(V[i], &data->fields.outputs[i]); CeedChkBackend(ierr); } diff --git a/backends/hip-ref/ceed-hip-ref-restriction.c b/backends/hip-ref/ceed-hip-ref-restriction.c index f332ee4568..01f275e9ac 100644 --- a/backends/hip-ref/ceed-hip-ref-restriction.c +++ b/backends/hip-ref/ceed-hip-ref-restriction.c @@ -35,15 +35,20 @@ static int CeedElemRestrictionApply_Hip(CeedElemRestriction r, hipFunction_t kernel; // Get vectors - const CeedScalar *d_u; - CeedScalar *d_v; - ierr = CeedVectorGetArrayRead(u, CEED_MEM_DEVICE, &d_u); CeedChkBackend(ierr); + const void *d_u; + void *d_v; + ierr = CeedVectorGetArrayReadGeneric(u, CEED_MEM_DEVICE, CEED_SCALAR_TYPE, + &d_u); + CeedChkBackend(ierr); if (t_mode == CEED_TRANSPOSE) { // Sum into for transpose mode, e-vec to l-vec - ierr = CeedVectorGetArray(v, CEED_MEM_DEVICE, &d_v); CeedChkBackend(ierr); + ierr = CeedVectorGetArrayGeneric(v, CEED_MEM_DEVICE, CEED_SCALAR_TYPE, &d_v); + CeedChkBackend(ierr); } else { // Overwrite for notranspose mode, l-vec to e-vec - ierr = CeedVectorGetArrayWrite(v, CEED_MEM_DEVICE, &d_v); CeedChkBackend(ierr); + ierr = CeedVectorGetArrayWriteGeneric(v, CEED_MEM_DEVICE, CEED_SCALAR_TYPE, + &d_v); + CeedChkBackend(ierr); } // Restrict @@ -87,8 +92,8 @@ static int CeedElemRestrictionApply_Hip(CeedElemRestriction r, *request = NULL; // Restore arrays - ierr = CeedVectorRestoreArrayRead(u, &d_u); CeedChkBackend(ierr); - ierr = CeedVectorRestoreArray(v, &d_v); CeedChkBackend(ierr); + ierr = CeedVectorRestoreArrayReadGeneric(u, &d_u); CeedChkBackend(ierr); + ierr = CeedVectorRestoreArrayGeneric(v, &d_v); CeedChkBackend(ierr); return CEED_ERROR_SUCCESS; } diff --git a/backends/hip-ref/ceed-hip-ref.h b/backends/hip-ref/ceed-hip-ref.h index 845b1e537d..7f7e93637d 100644 --- a/backends/hip-ref/ceed-hip-ref.h +++ b/backends/hip-ref/ceed-hip-ref.h @@ -62,8 +62,8 @@ typedef struct { // We use a struct to avoid having to memCpy the array of pointers // __global__ copies by value the struct. typedef struct { - const CeedScalar *inputs[CEED_FIELD_MAX]; - CeedScalar *outputs[CEED_FIELD_MAX]; + const void *inputs[CEED_FIELD_MAX]; + void *outputs[CEED_FIELD_MAX]; } Fields_Hip; typedef struct { From 5c8e2068441519be7384b49e12b7d94e1a2ccf20 Mon Sep 17 00:00:00 2001 From: Jed Brown Date: Mon, 2 May 2022 19:20:52 -0600 Subject: [PATCH 08/10] include: cleaner CEED_NUM_PRECISIONS --- include/ceed/ceed.h | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/include/ceed/ceed.h b/include/ceed/ceed.h index 3a8268dcd1..2c4ef57bc0 100644 --- a/include/ceed/ceed.h +++ b/include/ceed/ceed.h @@ -145,14 +145,14 @@ typedef enum { /// Single precision CEED_SCALAR_FP32, /// Double precision - CEED_SCALAR_FP64 + CEED_SCALAR_FP64, + /// Total number of allowed scalar precision types + CEED_NUM_PRECISIONS, } CeedScalarType; -/// Total number of allowed scalar precision types (size of CeedScalarType enum) -#define CEED_NUM_PRECISIONS 2 /// Struct for holding data in multiple precisions for mixed-precision-enabled /// backends typedef struct { - void *values[2]; // Size equals CEED_NUM_PRECISIONS + void *values[CEED_NUM_PRECISIONS]; // Size equals CEED_NUM_PRECISIONS } CeedScalarArray; /// Base scalar type for the library to use: change which header is /// included to change the precision. From df27fe0afae1cd3694d36cdd28059330954b7d52 Mon Sep 17 00:00:00 2001 From: Jed Brown Date: Mon, 2 May 2022 19:21:45 -0600 Subject: [PATCH 09/10] WIP: backends/cuda: fix type mismatch --- backends/cuda-ref/ceed-cuda-vector.c | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/backends/cuda-ref/ceed-cuda-vector.c b/backends/cuda-ref/ceed-cuda-vector.c index c67db91f71..3e605abb68 100644 --- a/backends/cuda-ref/ceed-cuda-vector.c +++ b/backends/cuda-ref/ceed-cuda-vector.c @@ -375,7 +375,7 @@ static int CeedVectorTakeArrayGeneric_Cuda(CeedVector vec, CeedMemType mem_type, bool need_sync = false; ierr = CeedVectorNeedSync_Cuda(vec, mem_type, &need_sync); CeedChkBackend(ierr); if (need_sync) { - ierr = CeedVectorSync_Cuda(vec, mem_type); CeedChkBackend(ierr); + ierr = CeedVectorSync_Cuda(vec, prec, mem_type); CeedChkBackend(ierr); } // Update pointer @@ -415,7 +415,7 @@ static int CeedVectorGetArrayCore_Cuda(const CeedVector vec, CeedChkBackend(ierr); if (need_sync) { // Sync array to requested mem_type - ierr = CeedVectorSync_Cuda(vec, mem_type); CeedChkBackend(ierr); + ierr = CeedVectorSync_Cuda(vec, prec, mem_type); CeedChkBackend(ierr); } // Update pointer From 112a04abfe01131401320829cf208e113026fac4 Mon Sep 17 00:00:00 2001 From: nbeams <246972+nbeams@users.noreply.github.com> Date: Fri, 26 Aug 2022 13:20:26 -0600 Subject: [PATCH 10/10] Resolve conflicts when updating from main --- backends/cuda-ref/ceed-cuda-vector.c | 4 ++-- include/ceed/types.h | 9 ++++++++- 2 files changed, 10 insertions(+), 3 deletions(-) diff --git a/backends/cuda-ref/ceed-cuda-vector.c b/backends/cuda-ref/ceed-cuda-vector.c index 2ec324c2ff..14b6da89b5 100644 --- a/backends/cuda-ref/ceed-cuda-vector.c +++ b/backends/cuda-ref/ceed-cuda-vector.c @@ -113,8 +113,8 @@ static inline int CeedVectorSyncD2H_Cuda(const CeedVector vec) { // Sync arrays //------------------------------------------------------------------------------ static int CeedVectorSyncArrayGeneric_Cuda(const CeedVector vec, - CeedMemType mem_type, - CeedScalarType prec) { + CeedMemType mem_type, + CeedScalarType prec) { int ierr; // Check whether device/host sync is needed bool need_sync = false; diff --git a/include/ceed/types.h b/include/ceed/types.h index f9e74e7afa..161f68c6d3 100644 --- a/include/ceed/types.h +++ b/include/ceed/types.h @@ -112,8 +112,15 @@ typedef enum { /// Single precision CEED_SCALAR_FP32, /// Double precision - CEED_SCALAR_FP64 + CEED_SCALAR_FP64, + /// Total number of allowed scalar precision types + CEED_NUM_PRECISIONS, } CeedScalarType; +/// Struct for holding data in multiple precisions for mixed-precision-enabled +/// backends +typedef struct { + void *values[CEED_NUM_PRECISIONS]; // Size equals CEED_NUM_PRECISIONS +} CeedScalarArray; /// Base scalar type for the library to use: change which header is /// included to change the precision. #include "ceed-f64.h"