PSCF v1.2
DeviceArray.h
1#ifndef PSCF_DEVICE_ARRAY_H
2#define PSCF_DEVICE_ARRAY_H
3
4/*
5* PSCF Package
6*
7* Copyright 2016 - 2022, The Regents of the University of Minnesota
8* Distributed under the terms of the GNU General Public License.
9*/
10
11#include "cudaErrorCheck.h"
12#include <util/global.h>
13#include <cuda_runtime.h>
14
15namespace Pscf {
16
17 using namespace Util;
18
19 // Forward declaration of analogous container for data on host.
20 template <typename Data> class HostDArray;
21
41 template <typename Data>
42 class DeviceArray
43 {
44
45 public:
46
50 typedef Data ElementType;
51
56
65
72
78 virtual ~DeviceArray();
79
87 void allocate(int capacity);
88
98 void associate(DeviceArray<Data>& arr, int beginId, int capacity);
99
107
114
127 virtual
129
143 virtual
145
151 int capacity() const;
152
156 bool isAllocated() const;
157
161 bool isOwner() const;
162
166 Data* cArray();
167
171 Data const * cArray() const;
172
173 protected:
174
176 Data* dataPtr_;
177
180
188
196
203 Data const * ownerDataPtr_;
204 };
205
206 /*
207 * Default constructor.
208 */
209 template <typename Data>
211 : dataPtr_(nullptr),
212 capacity_(0),
213 ownerPtr_(nullptr),
214 ownerCapacity_(0),
215 ownerDataPtr_(nullptr)
216 {}
217
218 /*
219 * Allocating constructor.
220 */
221 template <typename Data>
223 : dataPtr_(nullptr),
224 capacity_(0),
225 ownerPtr_(nullptr),
226 ownerCapacity_(0),
227 ownerDataPtr_(nullptr)
228 { allocate(capacity); }
229
230 /*
231 * Copy constructor.
232 *
233 * Allocates new memory and copies all elements by value.
234 */
235 template <typename Data>
237 {
238 if (!other.isAllocated()) {
239 UTIL_THROW("Other array must be allocated.");
240 }
241
242 allocate(other.capacity_);
243 cudaErrorCheck( cudaMemcpy(dataPtr_, other.cArray(),
244 capacity_ * sizeof(Data),
245 cudaMemcpyDeviceToDevice) );
246 }
247
248 /*
249 * Destructor.
250 */
251 template <typename Data>
253 {
254 if (isAllocated() && isOwner()) {
255 cudaErrorCheck( cudaFree(dataPtr_) );
256 capacity_ = 0;
257 }
258 }
259
260 /*
261 * Allocate the underlying C array.
262 */
263 template <typename Data>
265 {
266 if (isAllocated()) {
267 UTIL_THROW("Attempt to re-allocate an array");
268 }
269 if (ownerPtr_) {
270 UTIL_THROW("Attempt to allocate array already associated with data");
271 }
272 if (capacity <= 0) {
273 UTIL_THROW("Attempt to allocate with capacity <= 0");
274 }
275 cudaErrorCheck( cudaMalloc((void**) &dataPtr_, capacity * sizeof(Data)) );
276 capacity_ = capacity;
277
278 ownerPtr_ = nullptr;
279 }
280
281 /*
282 * Associate this object with a slice of a different DeviceArray.
283 */
284 template <typename Data>
286 int capacity)
287 {
288 UTIL_CHECK(arr.isAllocated());
289 UTIL_CHECK(arr.isOwner());
290 UTIL_CHECK(beginId >= 0);
291 UTIL_CHECK(capacity > 0);
292 UTIL_CHECK(beginId + capacity <= arr.capacity());
293
294 if (isAllocated()) {
295 UTIL_THROW("Attempt to associate an already-allocated array.");
296 }
297
298 dataPtr_ = arr.cArray() + beginId;
299 capacity_ = capacity;
300 ownerPtr_ = &arr;
301 ownerCapacity_ = arr.capacity();
302 ownerDataPtr_ = arr.cArray();
303 }
304
305 /*
306 * Deallocate the underlying C array.
307 *
308 * Throw an Exception if this array is not allocated.
309 */
310 template <typename Data>
312 {
313 if (!isAllocated()) {
314 UTIL_THROW("Array is not allocated");
315 }
316 if (!isOwner()) {
317 UTIL_THROW("Cannot deallocate, data not owned by this object.");
318 }
319 cudaErrorCheck( cudaFree(dataPtr_) );
320 dataPtr_ = nullptr; // reset to null
321 capacity_ = 0;
322 }
323
324 /*
325 * Dissociate this object from the associated array.
326 *
327 * Throw Exception if this object is not associated with another array.
328 */
329 template <typename Data>
331 {
332 if (isOwner()) {
333 UTIL_THROW("Cannot dissociate: this object owns the array.");
334 }
335 if (!isAllocated()) {
336 UTIL_THROW("Cannot dissociate: no associated data found.");
337 }
338 dataPtr_ = nullptr; // reset to null
339 capacity_ = 0;
340 ownerPtr_ = nullptr; // reset to null
341 ownerCapacity_ = 0;
342 ownerDataPtr_ = nullptr;
343 }
344
345 /*
346 * Assignment from another DeviceArray<Data>.
347 */
348 template <typename Data>
351 {
352 // Check for self assignment
353 if (this == &other) return *this;
354
355 // Precondition - RHS DeviceArray<Data> must be allocated
356 if (!other.isAllocated()) {
357 UTIL_THROW("Other DeviceArray<Data> must be allocated.");
358 }
359
360 // If this is not allocated, then allocate
361 if (!isAllocated()) {
362 allocate(other.capacity());
363 }
364
365 // Require equal capacity values
366 if (capacity_ != other.capacity_) {
367 UTIL_THROW("Cannot assign arrays of unequal capacity");
368 }
369
370 // Copy elements
371 cudaErrorCheck( cudaMemcpy(dataPtr_, other.cArray(),
372 capacity_ * sizeof(Data),
373 cudaMemcpyDeviceToDevice) );
374
375 return *this;
376 }
377
378 /*
379 * Assignment of LHS DeviceArray<Data> from RHS HostDArray<Data>.
380 */
381 template <typename Data>
384 {
385 // Precondition
386 if (!other.isAllocated()) {
387 UTIL_THROW("RHS HostDArray<Data> must be allocated.");
388 }
389
390 // Allocate this if necessary
391 if (!isAllocated()) {
392 allocate(other.capacity());
393 }
394
395 // Require equal capacity values
396 if (capacity_ != other.capacity()) {
397 UTIL_THROW("Cannot assign arrays of unequal capacity");
398 }
399
400 // Copy elements
401 cudaErrorCheck( cudaMemcpy(dataPtr_, other.cArray(),
402 capacity_ * sizeof(Data),
403 cudaMemcpyHostToDevice) );
404
405 return *this;
406 }
407
408 /*
409 * Get a pointer to the underlying C array.
410 */
411 template <typename Data>
413 {
414 // Make sure that owner array has not been deallocated / reallocated
415 if (ownerPtr_) {
416 UTIL_CHECK(ownerPtr_->isAllocated());
417 UTIL_CHECK(ownerPtr_->capacity() == ownerCapacity_);
418 UTIL_CHECK(ownerPtr_->cArray() == ownerDataPtr_);
419 }
420
421 return dataPtr_;
422 }
423
424 /*
425 * Get a pointer to const to the underlying C array.
426 */
427 template <typename Data>
428 const Data* DeviceArray<Data>::cArray() const
429 {
430 // Make sure that owner array has not been deallocated / reallocated
431 if (ownerPtr_) {
432 UTIL_CHECK(ownerPtr_->isAllocated());
433 UTIL_CHECK(ownerPtr_->capacity() == ownerCapacity_);
434 UTIL_CHECK(ownerPtr_->cArray() == ownerDataPtr_);
435 }
436
437 return dataPtr_;
438 }
439
440 /*
441 * Return true if the array has been allocated, false otherwise.
442 */
443 template <typename Data>
445 {
446 // Make sure that owner array has not been deallocated / reallocated
447 if (ownerPtr_) {
448 UTIL_CHECK(ownerPtr_->isAllocated());
449 UTIL_CHECK(ownerPtr_->capacity() == ownerCapacity_);
450 UTIL_CHECK(ownerPtr_->cArray() == ownerDataPtr_);
451 }
452
453 return (bool)dataPtr_;
454 }
455
456 /*
457 * Return allocated capacity.
458 */
459 template <typename Data>
461 { return capacity_; }
462
463 /*
464 * Does this object own the underlying data?
465 */
466 template <typename Data>
467 inline bool DeviceArray<Data>::isOwner() const
468 { return ((nullptr == ownerPtr_) && (nullptr != dataPtr_)); }
469
470} // namespace Pscf
471#endif
Dynamic array on the GPU device with aligned data.
Definition rpg/System.h:32
DeviceArray()
Default constructor.
bool isOwner() const
Does this object own the underlying data?
DeviceArray< Data > const * ownerPtr_
Pointer to array that owns this data, if isOwner_ == false.
void deallocate()
Dellocate the underlying C array.
DeviceArray(int capacity)
Allocating constructor.
int capacity_
Allocated size (capacity) of the array.
void dissociate()
Dissociate this object from the associated array.
virtual ~DeviceArray()
Destructor.
int ownerCapacity_
Capacity of parent array, if isOwner_ == false.
Data const * ownerDataPtr_
Const pointer to parent array, if isOwner_ == false.
virtual DeviceArray< Data > & operator=(const DeviceArray< Data > &other)
Assignment operator, assign from another DeviceArray<Data> array.
bool isAllocated() const
Return true if the array has been allocated, false otherwise.
void associate(DeviceArray< Data > &arr, int beginId, int capacity)
Associate this object with a slice of a different DeviceArray.
int capacity() const
Return allocated capacity.
Data * dataPtr_
Pointer to a C array of Data elements on the GPU device.
DeviceArray(DeviceArray< Data > const &other)
Copy constructor.
Data ElementType
Data type of each element.
Definition DeviceArray.h:50
void allocate(int capacity)
Allocate the underlying C array on the device.
Data const * cArray() const
Return const pointer to underlying C array.
Data * cArray()
Return pointer to underlying C array.
Template for dynamic array stored in host CPU memory.
Definition HostDArray.h:43
Data * cArray()
Return a pointer to the underlying C array.
Definition Array.h:214
int capacity() const
Return allocated size.
Definition Array.h:159
bool isAllocated() const
Return true if this DArray has been allocated, false otherwise.
Definition DArray.h:247
File containing preprocessor macros for error handling.
#define UTIL_CHECK(condition)
Assertion macro suitable for serial or parallel production code.
Definition global.h:68
#define UTIL_THROW(msg)
Macro for throwing an Exception, reporting function, file and line number.
Definition global.h:51
PSCF package top-level namespace.
Definition param_pc.dox:1
Utility classes for scientific computation.