PSCF v1.2
HostDArray.h
1#ifndef PSCF_HOST_D_ARRAY_H
2#define PSCF_HOST_D_ARRAY_H
3
4/*
5* PSCF Package
6*
7* Copyright 2016 - 2022, The Regents of the University of Minnesota
8* Distributed under the terms of the GNU General Public License.
9*/
10
11#include "DeviceArray.h"
12#include "cudaErrorCheck.h"
13#include <util/containers/DArray.h>
14#include <util/global.h>
15#include <cuda_runtime.h>
16
17namespace Pscf {
18
19 using namespace Util;
20
41 template <typename Data>
42 class HostDArray : public DArray<Data>
43 {
44
45 public:
46
50 typedef Data ElementType;
51
56
65
71 HostDArray(DArray<Data> const & other);
72
78 virtual ~HostDArray();
79
97 virtual
99
115 void copySlice(DeviceArray<Data> const & other, int beginId);
116
117 };
118
119 /*
120 * Default constructor.
121 */
122 template <typename Data>
124 : DArray<Data>()
125 {}
126
127 /*
128 * Allocating constructor.
129 */
130 template <typename Data>
134
135 /*
136 * Copy constructor. (Copies from any DArray or HostDArray).
137 */
138 template <typename Data>
140 : DArray<Data>(other) // Use DArray base class copy constructor
141 {}
142
143 /*
144 * Destructor.
145 */
146 template <typename Data>
148 {} // DArray base class destructor will deallocate memory
149
150 /*
151 * Assignment from a DeviceArray<Data> RHS device array.
152 */
153 template <typename Data>
156 {
157 // Precondition - RHS array must be allocated
158 if (!other.isAllocated()) {
159 UTIL_THROW("RHS DeviceArray<Data> must be allocated.");
160 }
161
162 // Allocate this if necessary
165 }
166
167 // Require equal capacities
168 if (DArray<Data>::capacity() != other.capacity()) {
169 UTIL_THROW("Cannot assign arrays of unequal capacity");
170 }
171
172 // Copy all elements
173 cudaErrorCheck( cudaMemcpy(DArray<Data>::cArray(), other.cArray(),
174 DArray<Data>::capacity() * sizeof(Data),
175 cudaMemcpyDeviceToHost) );
176
177 return *this;
178 }
179
180 /*
181 * Copy a slice of the data from a larger DeviceArray into this array.
182 */
183 template <typename Data>
185 int beginId)
186 {
187 // Precondition - device array must be allocated
188 if (!other.isAllocated()) {
189 UTIL_THROW("RHS DeviceArray<Data> must be allocated.");
190 }
191
192 // Precondition - host array must be allocated
194 UTIL_THROW("LHS HostDArray<Data> must be allocated.");
195 }
196
197 // Slice must not exceed the capacity of device array
198 if (DArray<Data>::capacity() + beginId > other.capacity()) {
199 UTIL_THROW("Slice must not exceed the capacity of device array.");
200 }
201
202 // Copy all elements
203 cudaErrorCheck( cudaMemcpy(DArray<Data>::cArray(),
204 other.cArray() + beginId,
205 DArray<Data>::capacity() * sizeof(Data),
206 cudaMemcpyDeviceToHost) );
207 }
208
209}
210#endif
Dynamic array on the GPU device with aligned data.
Definition rpg/System.h:32
bool isAllocated() const
Return true if the array has been allocated, false otherwise.
int capacity() const
Return allocated capacity.
Data * cArray()
Return pointer to underlying C array.
Template for dynamic array stored in host CPU memory.
Definition HostDArray.h:43
void copySlice(DeviceArray< Data > const &other, int beginId)
Copy a slice of the data from a larger DeviceArray into this array.
Definition HostDArray.h:184
HostDArray()
Default constructor.
Definition HostDArray.h:123
HostDArray(int capacity)
Allocating constructor.
Definition HostDArray.h:131
virtual ~HostDArray()
Destructor.
Definition HostDArray.h:147
Data ElementType
Data type of each element.
Definition HostDArray.h:50
virtual HostDArray< Data > & operator=(const DeviceArray< Data > &other)
Assignment operator, assign from DeviceArray<Data> device array.
Definition HostDArray.h:155
HostDArray(DArray< Data > const &other)
Copy constructor.
Definition HostDArray.h:139
int capacity() const
Return allocated size.
Definition Array.h:159
Dynamically allocatable contiguous array template.
void allocate(int capacity)
Allocate the underlying C array.
Definition DArray.h:199
File containing preprocessor macros for error handling.
#define UTIL_THROW(msg)
Macro for throwing an Exception, reporting function, file and line number.
Definition global.h:51
PSCF package top-level namespace.
Definition param_pc.dox:1
Utility classes for scientific computation.