#include <ceed.h>
#include <ceed/backend.h>
#include <math.h>
#include <stdbool.h>
#include <string.h>
#include <hip/hip_runtime.h>
#include "../hip/ceed-hip-common.h"
#include "ceed-hip-ref.h"
static inline int CeedVectorNeedSync_Hip(const CeedVector vec, CeedMemType mem_type, bool *need_sync) {
CeedVector_Hip *impl;
bool has_valid_array = false;
CeedCallBackend(CeedVectorGetData(vec, &impl));
CeedCallBackend(CeedVectorHasValidArray(vec, &has_valid_array));
switch (mem_type) {
case CEED_MEM_HOST:
*need_sync = has_valid_array && !impl->h_array;
break;
case CEED_MEM_DEVICE:
*need_sync = has_valid_array && !impl->d_array;
break;
}
return CEED_ERROR_SUCCESS;
}
static inline int CeedVectorSyncH2D_Hip(const CeedVector vec) {
Ceed ceed;
CeedSize length;
size_t bytes;
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
CeedCallBackend(CeedVectorGetData(vec, &impl));
CeedCheck(impl->h_array, ceed, CEED_ERROR_BACKEND, "No valid host data to sync to device");
CeedCallBackend(CeedVectorGetLength(vec, &length));
bytes = length * sizeof(CeedScalar);
if (impl->d_array_borrowed) {
impl->d_array = impl->d_array_borrowed;
} else if (impl->d_array_owned) {
impl->d_array = impl->d_array_owned;
} else {
CeedCallHip(ceed, hipMalloc((void **)&impl->d_array_owned, bytes));
impl->d_array = impl->d_array_owned;
}
CeedCallHip(ceed, hipMemcpy(impl->d_array, impl->h_array, bytes, hipMemcpyHostToDevice));
return CEED_ERROR_SUCCESS;
}
static inline int CeedVectorSyncD2H_Hip(const CeedVector vec) {
Ceed ceed;
CeedSize length;
size_t bytes;
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
CeedCallBackend(CeedVectorGetData(vec, &impl));
CeedCheck(impl->d_array, ceed, CEED_ERROR_BACKEND, "No valid device data to sync to host");
if (impl->h_array_borrowed) {
impl->h_array = impl->h_array_borrowed;
} else if (impl->h_array_owned) {
impl->h_array = impl->h_array_owned;
} else {
CeedSize length;
CeedCallBackend(CeedVectorGetLength(vec, &length));
CeedCallBackend(CeedCalloc(length, &impl->h_array_owned));
impl->h_array = impl->h_array_owned;
}
CeedCallBackend(CeedVectorGetLength(vec, &length));
bytes = length * sizeof(CeedScalar);
CeedCallHip(ceed, hipMemcpy(impl->h_array, impl->d_array, bytes, hipMemcpyDeviceToHost));
return CEED_ERROR_SUCCESS;
}
static int CeedVectorSyncArray_Hip(const CeedVector vec, CeedMemType mem_type) {
bool need_sync = false;
CeedCallBackend(CeedVectorNeedSync_Hip(vec, mem_type, &need_sync));
if (!need_sync) return CEED_ERROR_SUCCESS;
switch (mem_type) {
case CEED_MEM_HOST:
return CeedVectorSyncD2H_Hip(vec);
case CEED_MEM_DEVICE:
return CeedVectorSyncH2D_Hip(vec);
}
return CEED_ERROR_UNSUPPORTED;
}
static inline int CeedVectorSetAllInvalid_Hip(const CeedVector vec) {
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetData(vec, &impl));
impl->h_array = NULL;
impl->d_array = NULL;
return CEED_ERROR_SUCCESS;
}
static inline int CeedVectorHasValidArray_Hip(const CeedVector vec, bool *has_valid_array) {
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetData(vec, &impl));
*has_valid_array = impl->h_array || impl->d_array;
return CEED_ERROR_SUCCESS;
}
static inline int CeedVectorHasArrayOfType_Hip(const CeedVector vec, CeedMemType mem_type, bool *has_array_of_type) {
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetData(vec, &impl));
switch (mem_type) {
case CEED_MEM_HOST:
*has_array_of_type = impl->h_array_borrowed || impl->h_array_owned;
break;
case CEED_MEM_DEVICE:
*has_array_of_type = impl->d_array_borrowed || impl->d_array_owned;
break;
}
return CEED_ERROR_SUCCESS;
}
static inline int CeedVectorHasBorrowedArrayOfType_Hip(const CeedVector vec, CeedMemType mem_type, bool *has_borrowed_array_of_type) {
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetData(vec, &impl));
switch (mem_type) {
case CEED_MEM_HOST:
*has_borrowed_array_of_type = impl->h_array_borrowed;
break;
case CEED_MEM_DEVICE:
*has_borrowed_array_of_type = impl->d_array_borrowed;
break;
}
return CEED_ERROR_SUCCESS;
}
static int CeedVectorSetArrayHost_Hip(const CeedVector vec, const CeedCopyMode copy_mode, CeedScalar *array) {
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetData(vec, &impl));
switch (copy_mode) {
case CEED_COPY_VALUES: {
CeedSize length;
if (!impl->h_array_owned) {
CeedCallBackend(CeedVectorGetLength(vec, &length));
CeedCallBackend(CeedMalloc(length, &impl->h_array_owned));
}
impl->h_array_borrowed = NULL;
impl->h_array = impl->h_array_owned;
if (array) {
CeedSize length;
size_t bytes;
CeedCallBackend(CeedVectorGetLength(vec, &length));
bytes = length * sizeof(CeedScalar);
memcpy(impl->h_array, array, bytes);
}
} break;
case CEED_OWN_POINTER:
CeedCallBackend(CeedFree(&impl->h_array_owned));
impl->h_array_owned = array;
impl->h_array_borrowed = NULL;
impl->h_array = array;
break;
case CEED_USE_POINTER:
CeedCallBackend(CeedFree(&impl->h_array_owned));
impl->h_array_borrowed = array;
impl->h_array = array;
break;
}
return CEED_ERROR_SUCCESS;
}
static int CeedVectorSetArrayDevice_Hip(const CeedVector vec, const CeedCopyMode copy_mode, CeedScalar *array) {
Ceed ceed;
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
CeedCallBackend(CeedVectorGetData(vec, &impl));
switch (copy_mode) {
case CEED_COPY_VALUES: {
CeedSize length;
size_t bytes;
CeedCallBackend(CeedVectorGetLength(vec, &length));
bytes = length * sizeof(CeedScalar);
if (!impl->d_array_owned) {
CeedCallHip(ceed, hipMalloc((void **)&impl->d_array_owned, bytes));
}
impl->d_array_borrowed = NULL;
impl->d_array = impl->d_array_owned;
if (array) CeedCallHip(ceed, hipMemcpy(impl->d_array, array, bytes, hipMemcpyDeviceToDevice));
} break;
case CEED_OWN_POINTER:
CeedCallHip(ceed, hipFree(impl->d_array_owned));
impl->d_array_owned = array;
impl->d_array_borrowed = NULL;
impl->d_array = array;
break;
case CEED_USE_POINTER:
CeedCallHip(ceed, hipFree(impl->d_array_owned));
impl->d_array_owned = NULL;
impl->d_array_borrowed = array;
impl->d_array = array;
break;
}
return CEED_ERROR_SUCCESS;
}
static int CeedVectorSetArray_Hip(const CeedVector vec, const CeedMemType mem_type, const CeedCopyMode copy_mode, CeedScalar *array) {
Ceed ceed;
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
CeedCallBackend(CeedVectorGetData(vec, &impl));
CeedCallBackend(CeedVectorSetAllInvalid_Hip(vec));
switch (mem_type) {
case CEED_MEM_HOST:
return CeedVectorSetArrayHost_Hip(vec, copy_mode, array);
case CEED_MEM_DEVICE:
return CeedVectorSetArrayDevice_Hip(vec, copy_mode, array);
}
return CEED_ERROR_UNSUPPORTED;
}
static int CeedHostSetValue_Hip(CeedScalar *h_array, CeedSize length, CeedScalar val) {
for (CeedSize i = 0; i < length; i++) h_array[i] = val;
return CEED_ERROR_SUCCESS;
}
int CeedDeviceSetValue_Hip(CeedScalar *d_array, CeedSize length, CeedScalar val);
static int CeedVectorSetValue_Hip(CeedVector vec, CeedScalar val) {
Ceed ceed;
CeedSize length;
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
CeedCallBackend(CeedVectorGetData(vec, &impl));
CeedCallBackend(CeedVectorGetLength(vec, &length));
if (!impl->d_array && !impl->h_array) {
if (impl->d_array_borrowed) {
impl->d_array = impl->d_array_borrowed;
} else if (impl->h_array_borrowed) {
impl->h_array = impl->h_array_borrowed;
} else if (impl->d_array_owned) {
impl->d_array = impl->d_array_owned;
} else if (impl->h_array_owned) {
impl->h_array = impl->h_array_owned;
} else {
CeedCallBackend(CeedVectorSetArray(vec, CEED_MEM_DEVICE, CEED_COPY_VALUES, NULL));
}
}
if (impl->d_array) {
CeedCallBackend(CeedDeviceSetValue_Hip(impl->d_array, length, val));
impl->h_array = NULL;
}
if (impl->h_array) {
CeedCallBackend(CeedHostSetValue_Hip(impl->h_array, length, val));
impl->d_array = NULL;
}
return CEED_ERROR_SUCCESS;
}
static int CeedVectorTakeArray_Hip(CeedVector vec, CeedMemType mem_type, CeedScalar **array) {
Ceed ceed;
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
CeedCallBackend(CeedVectorGetData(vec, &impl));
CeedCallBackend(CeedVectorSyncArray(vec, mem_type));
switch (mem_type) {
case CEED_MEM_HOST:
(*array) = impl->h_array_borrowed;
impl->h_array_borrowed = NULL;
impl->h_array = NULL;
break;
case CEED_MEM_DEVICE:
(*array) = impl->d_array_borrowed;
impl->d_array_borrowed = NULL;
impl->d_array = NULL;
break;
}
return CEED_ERROR_SUCCESS;
}
static int CeedVectorGetArrayCore_Hip(const CeedVector vec, const CeedMemType mem_type, CeedScalar **array) {
Ceed ceed;
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
CeedCallBackend(CeedVectorGetData(vec, &impl));
CeedCallBackend(CeedVectorSyncArray(vec, mem_type));
switch (mem_type) {
case CEED_MEM_HOST:
*array = impl->h_array;
break;
case CEED_MEM_DEVICE:
*array = impl->d_array;
break;
}
return CEED_ERROR_SUCCESS;
}
static int CeedVectorGetArrayRead_Hip(const CeedVector vec, const CeedMemType mem_type, const CeedScalar **array) {
return CeedVectorGetArrayCore_Hip(vec, mem_type, (CeedScalar **)array);
}
static int CeedVectorGetArray_Hip(const CeedVector vec, const CeedMemType mem_type, CeedScalar **array) {
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetData(vec, &impl));
CeedCallBackend(CeedVectorGetArrayCore_Hip(vec, mem_type, array));
CeedCallBackend(CeedVectorSetAllInvalid_Hip(vec));
switch (mem_type) {
case CEED_MEM_HOST:
impl->h_array = *array;
break;
case CEED_MEM_DEVICE:
impl->d_array = *array;
break;
}
return CEED_ERROR_SUCCESS;
}
static int CeedVectorGetArrayWrite_Hip(const CeedVector vec, const CeedMemType mem_type, CeedScalar **array) {
bool has_array_of_type = true;
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetData(vec, &impl));
CeedCallBackend(CeedVectorHasArrayOfType_Hip(vec, mem_type, &has_array_of_type));
if (!has_array_of_type) {
CeedCallBackend(CeedVectorSetArray(vec, mem_type, CEED_COPY_VALUES, NULL));
} else {
switch (mem_type) {
case CEED_MEM_HOST:
if (impl->h_array_borrowed) impl->h_array = impl->h_array_borrowed;
else impl->h_array = impl->h_array_owned;
break;
case CEED_MEM_DEVICE:
if (impl->d_array_borrowed) impl->d_array = impl->d_array_borrowed;
else impl->d_array = impl->d_array_owned;
}
}
return CeedVectorGetArray_Hip(vec, mem_type, array);
}
static int CeedVectorNorm_Hip(CeedVector vec, CeedNormType type, CeedScalar *norm) {
Ceed ceed;
CeedSize length, num_calls;
const CeedScalar *d_array;
CeedVector_Hip *impl;
hipblasHandle_t handle;
CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
CeedCallBackend(CeedVectorGetData(vec, &impl));
CeedCallBackend(CeedVectorGetLength(vec, &length));
CeedCallBackend(CeedGetHipblasHandle_Hip(ceed, &handle));
num_calls = length / INT_MAX;
if (length % INT_MAX > 0) num_calls += 1;
CeedCallBackend(CeedVectorGetArrayRead(vec, CEED_MEM_DEVICE, &d_array));
switch (type) {
case CEED_NORM_1: {
*norm = 0.0;
if (CEED_SCALAR_TYPE == CEED_SCALAR_FP32) {
float sub_norm = 0.0;
float *d_array_start;
for (CeedInt i = 0; i < num_calls; i++) {
d_array_start = (float *)d_array + (CeedSize)(i)*INT_MAX;
CeedSize remaining_length = length - (CeedSize)(i)*INT_MAX;
CeedInt sub_length = (i == num_calls - 1) ? (CeedInt)(remaining_length) : INT_MAX;
CeedCallHipblas(ceed, hipblasSasum(handle, (CeedInt)sub_length, (float *)d_array_start, 1, &sub_norm));
*norm += sub_norm;
}
} else {
double sub_norm = 0.0;
double *d_array_start;
for (CeedInt i = 0; i < num_calls; i++) {
d_array_start = (double *)d_array + (CeedSize)(i)*INT_MAX;
CeedSize remaining_length = length - (CeedSize)(i)*INT_MAX;
CeedInt sub_length = (i == num_calls - 1) ? (CeedInt)(remaining_length) : INT_MAX;
CeedCallHipblas(ceed, hipblasDasum(handle, (CeedInt)sub_length, (double *)d_array_start, 1, &sub_norm));
*norm += sub_norm;
}
}
break;
}
case CEED_NORM_2: {
if (CEED_SCALAR_TYPE == CEED_SCALAR_FP32) {
float sub_norm = 0.0, norm_sum = 0.0;
float *d_array_start;
for (CeedInt i = 0; i < num_calls; i++) {
d_array_start = (float *)d_array + (CeedSize)(i)*INT_MAX;
CeedSize remaining_length = length - (CeedSize)(i)*INT_MAX;
CeedInt sub_length = (i == num_calls - 1) ? (CeedInt)(remaining_length) : INT_MAX;
CeedCallHipblas(ceed, hipblasSnrm2(handle, (CeedInt)sub_length, (float *)d_array_start, 1, &sub_norm));
norm_sum += sub_norm * sub_norm;
}
*norm = sqrt(norm_sum);
} else {
double sub_norm = 0.0, norm_sum = 0.0;
double *d_array_start;
for (CeedInt i = 0; i < num_calls; i++) {
d_array_start = (double *)d_array + (CeedSize)(i)*INT_MAX;
CeedSize remaining_length = length - (CeedSize)(i)*INT_MAX;
CeedInt sub_length = (i == num_calls - 1) ? (CeedInt)(remaining_length) : INT_MAX;
CeedCallHipblas(ceed, hipblasDnrm2(handle, (CeedInt)sub_length, (double *)d_array_start, 1, &sub_norm));
norm_sum += sub_norm * sub_norm;
}
*norm = sqrt(norm_sum);
}
break;
}
case CEED_NORM_MAX: {
CeedInt index;
if (CEED_SCALAR_TYPE == CEED_SCALAR_FP32) {
float sub_max = 0.0, current_max = 0.0;
float *d_array_start;
for (CeedInt i = 0; i < num_calls; i++) {
d_array_start = (float *)d_array + (CeedSize)(i)*INT_MAX;
CeedSize remaining_length = length - (CeedSize)(i)*INT_MAX;
CeedInt sub_length = (i == num_calls - 1) ? (CeedInt)(remaining_length) : INT_MAX;
CeedCallHipblas(ceed, hipblasIsamax(handle, (CeedInt)sub_length, (float *)d_array_start, 1, &index));
CeedCallHip(ceed, hipMemcpy(&sub_max, d_array_start + index - 1, sizeof(CeedScalar), hipMemcpyDeviceToHost));
if (fabs(sub_max) > current_max) current_max = fabs(sub_max);
}
*norm = current_max;
} else {
double sub_max = 0.0, current_max = 0.0;
double *d_array_start;
for (CeedInt i = 0; i < num_calls; i++) {
d_array_start = (double *)d_array + (CeedSize)(i)*INT_MAX;
CeedSize remaining_length = length - (CeedSize)(i)*INT_MAX;
CeedInt sub_length = (i == num_calls - 1) ? (CeedInt)(remaining_length) : INT_MAX;
CeedCallHipblas(ceed, hipblasIdamax(handle, (CeedInt)sub_length, (double *)d_array_start, 1, &index));
CeedCallHip(ceed, hipMemcpy(&sub_max, d_array_start + index - 1, sizeof(CeedScalar), hipMemcpyDeviceToHost));
if (fabs(sub_max) > current_max) current_max = fabs(sub_max);
}
*norm = current_max;
}
break;
}
}
CeedCallBackend(CeedVectorRestoreArrayRead(vec, &d_array));
return CEED_ERROR_SUCCESS;
}
static int CeedHostReciprocal_Hip(CeedScalar *h_array, CeedSize length) {
for (CeedSize i = 0; i < length; i++) {
if (fabs(h_array[i]) > CEED_EPSILON) h_array[i] = 1. / h_array[i];
}
return CEED_ERROR_SUCCESS;
}
int CeedDeviceReciprocal_Hip(CeedScalar *d_array, CeedSize length);
static int CeedVectorReciprocal_Hip(CeedVector vec) {
Ceed ceed;
CeedSize length;
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
CeedCallBackend(CeedVectorGetData(vec, &impl));
CeedCallBackend(CeedVectorGetLength(vec, &length));
if (impl->d_array) CeedCallBackend(CeedDeviceReciprocal_Hip(impl->d_array, length));
if (impl->h_array) CeedCallBackend(CeedHostReciprocal_Hip(impl->h_array, length));
return CEED_ERROR_SUCCESS;
}
static int CeedHostScale_Hip(CeedScalar *x_array, CeedScalar alpha, CeedSize length) {
for (CeedSize i = 0; i < length; i++) x_array[i] *= alpha;
return CEED_ERROR_SUCCESS;
}
int CeedDeviceScale_Hip(CeedScalar *x_array, CeedScalar alpha, CeedSize length);
static int CeedVectorScale_Hip(CeedVector x, CeedScalar alpha) {
Ceed ceed;
CeedSize length;
CeedVector_Hip *x_impl;
CeedCallBackend(CeedVectorGetCeed(x, &ceed));
CeedCallBackend(CeedVectorGetData(x, &x_impl));
CeedCallBackend(CeedVectorGetLength(x, &length));
if (x_impl->d_array) CeedCallBackend(CeedDeviceScale_Hip(x_impl->d_array, alpha, length));
if (x_impl->h_array) CeedCallBackend(CeedHostScale_Hip(x_impl->h_array, alpha, length));
return CEED_ERROR_SUCCESS;
}
static int CeedHostAXPY_Hip(CeedScalar *y_array, CeedScalar alpha, CeedScalar *x_array, CeedSize length) {
for (CeedSize i = 0; i < length; i++) y_array[i] += alpha * x_array[i];
return CEED_ERROR_SUCCESS;
}
int CeedDeviceAXPY_Hip(CeedScalar *y_array, CeedScalar alpha, CeedScalar *x_array, CeedSize length);
static int CeedVectorAXPY_Hip(CeedVector y, CeedScalar alpha, CeedVector x) {
Ceed ceed;
CeedSize length;
CeedVector_Hip *y_impl, *x_impl;
CeedCallBackend(CeedVectorGetCeed(y, &ceed));
CeedCallBackend(CeedVectorGetData(y, &y_impl));
CeedCallBackend(CeedVectorGetData(x, &x_impl));
CeedCallBackend(CeedVectorGetLength(y, &length));
if (y_impl->d_array) {
CeedCallBackend(CeedVectorSyncArray(x, CEED_MEM_DEVICE));
CeedCallBackend(CeedDeviceAXPY_Hip(y_impl->d_array, alpha, x_impl->d_array, length));
}
if (y_impl->h_array) {
CeedCallBackend(CeedVectorSyncArray(x, CEED_MEM_HOST));
CeedCallBackend(CeedHostAXPY_Hip(y_impl->h_array, alpha, x_impl->h_array, length));
}
return CEED_ERROR_SUCCESS;
}
static int CeedHostAXPBY_Hip(CeedScalar *y_array, CeedScalar alpha, CeedScalar beta, CeedScalar *x_array, CeedSize length) {
for (CeedSize i = 0; i < length; i++) y_array[i] += alpha * x_array[i] + beta * y_array[i];
return CEED_ERROR_SUCCESS;
}
int CeedDeviceAXPBY_Hip(CeedScalar *y_array, CeedScalar alpha, CeedScalar beta, CeedScalar *x_array, CeedSize length);
static int CeedVectorAXPBY_Hip(CeedVector y, CeedScalar alpha, CeedScalar beta, CeedVector x) {
Ceed ceed;
CeedSize length;
CeedVector_Hip *y_impl, *x_impl;
CeedCallBackend(CeedVectorGetCeed(y, &ceed));
CeedCallBackend(CeedVectorGetData(y, &y_impl));
CeedCallBackend(CeedVectorGetData(x, &x_impl));
CeedCallBackend(CeedVectorGetLength(y, &length));
if (y_impl->d_array) {
CeedCallBackend(CeedVectorSyncArray(x, CEED_MEM_DEVICE));
CeedCallBackend(CeedDeviceAXPBY_Hip(y_impl->d_array, alpha, beta, x_impl->d_array, length));
}
if (y_impl->h_array) {
CeedCallBackend(CeedVectorSyncArray(x, CEED_MEM_HOST));
CeedCallBackend(CeedHostAXPBY_Hip(y_impl->h_array, alpha, beta, x_impl->h_array, length));
}
return CEED_ERROR_SUCCESS;
}
static int CeedHostPointwiseMult_Hip(CeedScalar *w_array, CeedScalar *x_array, CeedScalar *y_array, CeedSize length) {
for (CeedSize i = 0; i < length; i++) w_array[i] = x_array[i] * y_array[i];
return CEED_ERROR_SUCCESS;
}
int CeedDevicePointwiseMult_Hip(CeedScalar *w_array, CeedScalar *x_array, CeedScalar *y_array, CeedSize length);
static int CeedVectorPointwiseMult_Hip(CeedVector w, CeedVector x, CeedVector y) {
Ceed ceed;
CeedSize length;
CeedVector_Hip *w_impl, *x_impl, *y_impl;
CeedCallBackend(CeedVectorGetCeed(w, &ceed));
CeedCallBackend(CeedVectorGetData(w, &w_impl));
CeedCallBackend(CeedVectorGetData(x, &x_impl));
CeedCallBackend(CeedVectorGetData(y, &y_impl));
CeedCallBackend(CeedVectorGetLength(w, &length));
if (!w_impl->d_array && !w_impl->h_array) {
CeedCallBackend(CeedVectorSetValue(w, 0.0));
}
if (w_impl->d_array) {
CeedCallBackend(CeedVectorSyncArray(x, CEED_MEM_DEVICE));
CeedCallBackend(CeedVectorSyncArray(y, CEED_MEM_DEVICE));
CeedCallBackend(CeedDevicePointwiseMult_Hip(w_impl->d_array, x_impl->d_array, y_impl->d_array, length));
}
if (w_impl->h_array) {
CeedCallBackend(CeedVectorSyncArray(x, CEED_MEM_HOST));
CeedCallBackend(CeedVectorSyncArray(y, CEED_MEM_HOST));
CeedCallBackend(CeedHostPointwiseMult_Hip(w_impl->h_array, x_impl->h_array, y_impl->h_array, length));
}
return CEED_ERROR_SUCCESS;
}
static int CeedVectorDestroy_Hip(const CeedVector vec) {
Ceed ceed;
CeedVector_Hip *impl;
CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
CeedCallBackend(CeedVectorGetData(vec, &impl));
CeedCallHip(ceed, hipFree(impl->d_array_owned));
CeedCallBackend(CeedFree(&impl->h_array_owned));
CeedCallBackend(CeedFree(&impl));
return CEED_ERROR_SUCCESS;
}
int CeedVectorCreate_Hip(CeedSize n, CeedVector vec) {
CeedVector_Hip *impl;
Ceed ceed;
CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "HasValidArray", CeedVectorHasValidArray_Hip));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "HasBorrowedArrayOfType", CeedVectorHasBorrowedArrayOfType_Hip));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "SetArray", CeedVectorSetArray_Hip));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "TakeArray", CeedVectorTakeArray_Hip));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "SetValue", (int (*)())CeedVectorSetValue_Hip));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "SyncArray", CeedVectorSyncArray_Hip));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "GetArray", CeedVectorGetArray_Hip));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayRead", CeedVectorGetArrayRead_Hip));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "GetArrayWrite", CeedVectorGetArrayWrite_Hip));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "Norm", CeedVectorNorm_Hip));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "Reciprocal", CeedVectorReciprocal_Hip));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "Scale", (int (*)())CeedVectorScale_Hip));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "AXPY", (int (*)())CeedVectorAXPY_Hip));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "AXPBY", (int (*)())CeedVectorAXPBY_Hip));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "PointwiseMult", CeedVectorPointwiseMult_Hip));
CeedCallBackend(CeedSetBackendFunction(ceed, "Vector", vec, "Destroy", CeedVectorDestroy_Hip));
CeedCallBackend(CeedCalloc(1, &impl));
CeedCallBackend(CeedVectorSetData(vec, impl));
return CEED_ERROR_SUCCESS;
}