1#ifndef PSCF_DEVICE_ARRAY_H
2#define PSCF_DEVICE_ARRAY_H
11#include "cudaErrorCheck.h"
13#include <cuda_runtime.h>
20 template <
typename Data>
class HostDArray;
41 template <
typename Data>
209 template <
typename Data>
215 ownerDataPtr_(nullptr)
221 template <
typename Data>
227 ownerDataPtr_(nullptr)
235 template <
typename Data>
238 if (!other.isAllocated()) {
242 allocate(other.capacity_);
243 cudaErrorCheck( cudaMemcpy(dataPtr_, other.cArray(),
244 capacity_ *
sizeof(Data),
245 cudaMemcpyDeviceToDevice) );
251 template <
typename Data>
254 if (isAllocated() && isOwner()) {
255 cudaErrorCheck( cudaFree(dataPtr_) );
263 template <
typename Data>
267 UTIL_THROW(
"Attempt to re-allocate an array");
270 UTIL_THROW(
"Attempt to allocate array already associated with data");
273 UTIL_THROW(
"Attempt to allocate with capacity <= 0");
275 cudaErrorCheck( cudaMalloc((
void**) &dataPtr_, capacity *
sizeof(Data)) );
276 capacity_ = capacity;
284 template <
typename Data>
292 UTIL_CHECK(beginId + capacity <= arr.capacity());
295 UTIL_THROW(
"Attempt to associate an already-allocated array.");
298 dataPtr_ = arr.cArray() + beginId;
299 capacity_ = capacity;
301 ownerCapacity_ = arr.capacity();
302 ownerDataPtr_ = arr.cArray();
310 template <
typename Data>
313 if (!isAllocated()) {
317 UTIL_THROW(
"Cannot deallocate, data not owned by this object.");
319 cudaErrorCheck( cudaFree(dataPtr_) );
329 template <
typename Data>
333 UTIL_THROW(
"Cannot dissociate: this object owns the array.");
335 if (!isAllocated()) {
336 UTIL_THROW(
"Cannot dissociate: no associated data found.");
342 ownerDataPtr_ =
nullptr;
348 template <
typename Data>
353 if (
this == &other)
return *
this;
356 if (!other.isAllocated()) {
357 UTIL_THROW(
"Other DeviceArray<Data> must be allocated.");
361 if (!isAllocated()) {
362 allocate(other.capacity());
366 if (capacity_ != other.capacity_) {
367 UTIL_THROW(
"Cannot assign arrays of unequal capacity");
371 cudaErrorCheck( cudaMemcpy(dataPtr_, other.cArray(),
372 capacity_ *
sizeof(Data),
373 cudaMemcpyDeviceToDevice) );
381 template <
typename Data>
387 UTIL_THROW(
"RHS HostDArray<Data> must be allocated.");
391 if (!isAllocated()) {
396 if (capacity_ != other.
capacity()) {
397 UTIL_THROW(
"Cannot assign arrays of unequal capacity");
401 cudaErrorCheck( cudaMemcpy(dataPtr_, other.
cArray(),
402 capacity_ *
sizeof(Data),
403 cudaMemcpyHostToDevice) );
411 template <
typename Data>
417 UTIL_CHECK(ownerPtr_->capacity() == ownerCapacity_);
418 UTIL_CHECK(ownerPtr_->cArray() == ownerDataPtr_);
427 template <
typename Data>
433 UTIL_CHECK(ownerPtr_->capacity() == ownerCapacity_);
434 UTIL_CHECK(ownerPtr_->cArray() == ownerDataPtr_);
443 template <
typename Data>
449 UTIL_CHECK(ownerPtr_->capacity() == ownerCapacity_);
450 UTIL_CHECK(ownerPtr_->cArray() == ownerDataPtr_);
453 return (
bool)dataPtr_;
459 template <
typename Data>
461 {
return capacity_; }
466 template <
typename Data>
468 {
return ((
nullptr == ownerPtr_) && (
nullptr != dataPtr_)); }
Dynamic array on the GPU device with aligned data.
DeviceArray()
Default constructor.
bool isOwner() const
Does this object own the underlying data?
DeviceArray< Data > const * ownerPtr_
Pointer to array that owns this data, if isOwner_ == false.
void deallocate()
Dellocate the underlying C array.
DeviceArray(int capacity)
Allocating constructor.
int capacity_
Allocated size (capacity) of the array.
void dissociate()
Dissociate this object from the associated array.
virtual ~DeviceArray()
Destructor.
int ownerCapacity_
Capacity of parent array, if isOwner_ == false.
Data const * ownerDataPtr_
Const pointer to parent array, if isOwner_ == false.
virtual DeviceArray< Data > & operator=(const DeviceArray< Data > &other)
Assignment operator, assign from another DeviceArray<Data> array.
bool isAllocated() const
Return true if the array has been allocated, false otherwise.
void associate(DeviceArray< Data > &arr, int beginId, int capacity)
Associate this object with a slice of a different DeviceArray.
int capacity() const
Return allocated capacity.
Data * dataPtr_
Pointer to a C array of Data elements on the GPU device.
DeviceArray(DeviceArray< Data > const &other)
Copy constructor.
Data ElementType
Data type of each element.
void allocate(int capacity)
Allocate the underlying C array on the device.
Data const * cArray() const
Return const pointer to underlying C array.
Data * cArray()
Return pointer to underlying C array.
Template for dynamic array stored in host CPU memory.
Data * cArray()
Return a pointer to the underlying C array.
int capacity() const
Return allocated size.
bool isAllocated() const
Return true if this DArray has been allocated, false otherwise.
File containing preprocessor macros for error handling.
#define UTIL_CHECK(condition)
Assertion macro suitable for serial or parallel production code.
#define UTIL_THROW(msg)
Macro for throwing an Exception, reporting function, file and line number.
PSCF package top-level namespace.
Utility classes for scientific computation.