PSCF v1.2
LrAmPreCompressor.tpp
1#ifndef RPG_LR_AM_COMPRESSOR_TPP
2#define RPG_LR_AM_COMPRESSOR_TPP
3
4/*
5* PSCF - Polymer Self-Consistent Field Theory
6*
7* Copyright 2016 - 2022, The Regents of the University of Minnesota
8* Distributed under the terms of the GNU General Public License.
9*/
10
11#include "LrAmPreCompressor.h"
12#include <rpg/System.h>
13#include <rpg/fts/compressor/intra/IntraCorrelation.h>
14#include <prdc/crystal/shiftToMinimum.h>
15#include <prdc/cuda/resources.h>
16#include <pscf/chem/Monomer.h>
17#include <pscf/mesh/MeshIterator.h>
18#include <complex>
19#include <util/global.h>
20
21namespace Pscf {
22namespace Rpg {
23
24 using namespace Util;
25
26 // Constructor
27 template <int D>
29 : Compressor<D>(system),
30 isAllocated_(false),
31 intra_(system)
32 { setClassName("LrAmPreCompressor"); }
33
34 // Destructor
35 template <int D>
38
39 // Read parameters from file
40 template <int D>
42 {
43 // Call parent class readParameters
46 }
47
48 // Initialize just before entry to iterative loop.
49 template <int D>
50 void LrAmPreCompressor<D>::setup(bool isContinuation)
51 {
52 const int nMonomer = system().mixture().nMonomer();
53 const int meshSize = system().domain().mesh().size();
54 IntVec<D> const & dimensions = system().mesh().dimensions();
55
56 // Allocate memory required by AM algorithm if not done earlier.
58 DeviceArray<cudaReal> >::setup(isContinuation);
59
60 // Compute Fourier space kMeshDimensions_
61 for (int i = 0; i < D; ++i) {
62 if (i < D - 1) {
63 kMeshDimensions_[i] = dimensions[i];
64 } else {
65 kMeshDimensions_[i] = dimensions[i]/2 + 1;
66 }
67 }
68
69 // Compute number of points in k-space grid
70 kSize_ = 1;
71 for (int i = 0; i < D; ++i) {
72 kSize_ *= kMeshDimensions_[i];
73 }
74
75 // Allocate memory required by compressor if not done earlier.
76 if (!isAllocated_){
77 w0_.allocate(nMonomer);
78 wFieldTmp_.allocate(nMonomer);
79 error_.allocate(dimensions);
80 resid_.allocate(dimensions);
81 residK_.allocate(dimensions);
82 intraCorrelation_.allocate(kMeshDimensions_);
83 for (int i = 0; i < nMonomer; ++i) {
84 w0_[i].allocate(dimensions);
85 wFieldTmp_[i].allocate(dimensions);
86 }
87 isAllocated_ = true;
88 }
89
90 // Store value of initial guess chemical potential fields
91 for (int i = 0; i < nMonomer; ++i) {
92 VecOp::eqV(w0_[i], system().w().rgrid(i));
93 }
94
95 // Compute intramolecular correlation
96 intraCorrelation_ = intra_.computeIntraCorrelations();
97 }
98
99 // Iterative solver (AM algorithm)
100 template <int D>
102 {
103 int solve = AmIteratorTmpl<Compressor<D>,
104 DeviceArray<cudaReal> >::solve();
105 //mdeCounter_ = AmIteratorTmpl<Compressor<D>, DeviceArray<cudaReal>>::totalItr();
106 return solve;
107 }
108
109 // Assign one array to another
110 template <int D>
112 DeviceArray<cudaReal> const & b)
113 {
114 UTIL_CHECK(b.capacity() == a.capacity());
115 VecOp::eqV(a, b);
116 }
117
118 // Compute and return inner product of two vectors.
119 template <int D>
120 double LrAmPreCompressor<D>::dotProduct(DeviceArray<cudaReal> const & a,
121 DeviceArray<cudaReal> const & b)
122 {
123 UTIL_CHECK(a.capacity() == b.capacity());
124 return Reduce::innerProduct(a, b);
125 }
126
127 // Compute and return maximum element of a vector.
128 template <int D>
129 double LrAmPreCompressor<D>::maxAbs(DeviceArray<cudaReal> const & a)
130 {
131 return Reduce::maxAbs(a);
132 }
133
134 // Update basis
135 template <int D>
136 void
137 LrAmPreCompressor<D>::updateBasis(RingBuffer< DeviceArray<cudaReal> > & basis,
138 RingBuffer< DeviceArray<cudaReal> > const & hists)
139 {
140 // Make sure at least two histories are stored
141 UTIL_CHECK(hists.size() >= 2);
142
143 basis.advance();
144 if (basis[0].isAllocated()) {
145 UTIL_CHECK(basis[0].capacity() == hists[0].capacity());
146 } else {
147 basis[0].allocate(hists[0].capacity());
148 }
149
150 VecOp::subVV(basis[0], hists[0], hists[1]);
151 }
152
153 template <int D>
154 void
155 LrAmPreCompressor<D>::addHistories(DeviceArray<cudaReal>& trial,
156 RingBuffer<DeviceArray<cudaReal> > const & basis,
157 DArray<double> coeffs,
158 int nHist)
159 {
160 for (int i = 0; i < nHist; i++) {
161 VecOp::addEqVc(trial, basis[i], -1.0 * coeffs[i]);
162 }
163 }
164
165 template <int D>
166 void
167 LrAmPreCompressor<D>::addPredictedError(DeviceArray<cudaReal>& fieldTrial,
168 DeviceArray<cudaReal> const & resTrial,
169 double lambda)
170 {
171 VecOp::addEqVc(fieldTrial, resTrial, lambda);
172 }
173
174 // Does the system have an initial field guess?
175 template <int D>
176 bool LrAmPreCompressor<D>::hasInitialGuess()
177 { return system().w().hasData(); }
178
179 // Compute and return the number of elements in a field vector
180 template <int D>
181 int LrAmPreCompressor<D>::nElements()
182 { return system().domain().mesh().size(); }
183
184 // Get the current field from the system
185 template <int D>
186 void LrAmPreCompressor<D>::getCurrent(DeviceArray<cudaReal>& curr)
187 {
188 /*
189 * The field that we are adjusting is the Langrange multiplier field
190 * with number of grid pts components.The current value is the difference
191 * between w and w0_ for the first monomer (any monomer should give the
192 * same answer)
193 */
194 VecOp::subVV(curr, system().w().rgrid(0), w0_[0]);
195 }
196
197 // Perform the main system computation (solve the MDE)
198 template <int D>
199 void LrAmPreCompressor<D>::evaluate()
200 {
201 system().compute();
202 ++mdeCounter_;
203 }
204
205 // Compute the residual for the current system state
206 template <int D>
207 void LrAmPreCompressor<D>::getResidual(DeviceArray<cudaReal>& resid)
208 {
209 const int nMonomer = system().mixture().nMonomer();
210 const double vMonomer = system().mixture().vMonomer();
211
212 // Compute incompressibility constraint error vector elements
213 VecOp::subVS(resid_, system().c().rgrid(0), 1.0);
214 for (int i = 1; i < nMonomer; i++) {
215 VecOp::addEqV(resid_, system().c().rgrid(i));
216 }
217
218 // Convert residual to Fourier Space
219 system().fft().forwardTransform(resid_, residK_);
220
221 // Residual combine with Linear response factor
222 VecOp::divEqVc(residK_, intraCorrelation_, vMonomer);
223
224 // Convert back to real Space (destroys residK_)
225 system().fft().inverseTransformUnsafe(residK_, resid_);
226
227 // Assign resid_ to resid
228 VecOp::eqV(resid, resid_);
229
230 }
231
232 // Update the current system field coordinates
233 template <int D>
234 void LrAmPreCompressor<D>::update(DeviceArray<cudaReal>& newGuess)
235 {
236 // Convert back to field format
237 const int nMonomer = system().mixture().nMonomer();
238
239 // New field is the w0_ + the newGuess for the Lagrange multiplier field
240 for (int i = 0; i < nMonomer; i++) {
241 VecOp::addVV(wFieldTmp_[i], w0_[i], newGuess);
242 }
243
244 // Set system r grid
245 system().setWRGrid(wFieldTmp_);
246 }
247
248 template<int D>
249 void LrAmPreCompressor<D>::outputToLog()
250 {}
251
252 template<int D>
254 {
255 // Output timing results, if requested.
256 out << "\n";
257 out << "Compressor times contributions:\n";
259 }
260
261
262 template<int D>
264 {
266 mdeCounter_ = 0;
267 }
268
269 template<int D>
271 {
272 return 1.0;
273 }
274
275 template<int D>
277 DeviceArray<cudaReal>& fieldTrial,
278 std::string errorType,
279 int verbose)
280 {
281 double error = 0.0;
282 const int n = nElements();
283 const int nMonomer = system().mixture().nMonomer();
284
285 // Initialize residuals to sum of all monomer compositions minus 1
286 VecOp::subVS(error_, system().c().rgrid(0), 1.0);
287 for (int i = 1; i < nMonomer; i++) {
288 VecOp::addEqV(error_, system().c().rgrid(i));
289 }
290
291 // Find max residual vector element
292 double maxRes = maxAbs(error_);
293
294 // Find norm of residual vector
295 double normRes = AmIteratorTmpl<Compressor<D>,
296 DeviceArray<cudaReal> >::norm(error_);
297
298 // Find root-mean-squared residual element value
299 double rmsRes = normRes/sqrt(n);
300 if (verbose > 1) {
301 Log::file() << "\n";
302 Log::file() << "Max Residual = " << Dbl(maxRes,15) << "\n";
303 Log::file() << "Residual Norm = " << Dbl(normRes,15) << "\n";
304 Log::file() << "RMS Residual = " << Dbl(rmsRes,15);
305
306 // Check if calculation has diverged (normRes will be NaN)
307 UTIL_CHECK(!std::isnan(normRes));
308 error = normRes;
309 Log::file() <<"\n";
310 // Set error value
311 if (errorType == "maxResid") {
312 error = maxRes;
313 } else if (errorType == "normResid") {
314 error = normRes;
315 } else if (errorType == "rmsResid") {
316 error = rmsRes;
317 } else {
318 UTIL_THROW("Invalid iterator error type in parameter file.");
319 }
320
321 } else {
322 // Set error value
323 if (errorType == "maxResid") {
324 error = maxRes;
325 } else if (errorType == "normResid") {
326 error = normRes;
327 } else if (errorType == "rmsResid") {
328 error = normRes/sqrt(n);
329 } else {
330 UTIL_THROW("Invalid iterator error type in parameter file.");
331 }
332 //Log::file() << ", error = " << Dbl(error, 15) << "\n";
333 }
334
335 return error;
336 }
337
338}
339}
340#endif
Template for Anderson mixing iterator algorithm.
Dynamic array on the GPU device with aligned data.
Definition rpg/System.h:32
int capacity() const
Return allocated capacity.
An IntVec<D, T> is a D-component vector of elements of integer type T.
Definition IntVec.h:27
Base class for iterators that impose incompressibility.
Anderson Mixing compressor with linear-response preconditioning.
LrAmPreCompressor(System< D > &system)
Constructor.
double computeError(DeviceArray< cudaReal > &residTrial, DeviceArray< cudaReal > &fieldTrial, std::string errorType, int verbose)
Compute and return error used to test for convergence.
void readParameters(std::istream &in)
Read all parameters and initialize.
void setup(bool isContinuation)
Initialize just before entry to iterative loop.
void clearTimers()
Reset / clear all timers.
int compress()
Compress to obtain partial saddle point w+.
void outputTimers(std::ostream &out)
Write a report of time contributions used by this algorithm.
Main class for calculations that represent one system.
Definition rpg/System.h:107
Dynamically allocatable contiguous array template.
Wrapper for a double precision number, for formatted ostream output.
Definition Dbl.h:40
static std::ostream & file()
Get log ostream by reference.
Definition Log.cpp:57
Class for storing history of previous values in an array.
Definition RingBuffer.h:27
File containing preprocessor macros for error handling.
#define UTIL_CHECK(condition)
Assertion macro suitable for serial or parallel production code.
Definition global.h:68
#define UTIL_THROW(msg)
Macro for throwing an Exception, reporting function, file and line number.
Definition global.h:51
cudaReal innerProduct(DeviceArray< cudaReal > const &a, DeviceArray< cudaReal > const &b)
Compute inner product of two real arrays (GPU kernel wrapper).
Definition Reduce.cu:891
cudaReal maxAbs(DeviceArray< cudaReal > const &in)
Get maximum absolute magnitude of array elements (GPU kernel wrapper).
Definition Reduce.cu:648
void addEqV(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, const int beginIdA, const int beginIdB, const int n)
Vector addition in-place, a[i] += b[i], kernel wrapper (cudaReal).
Definition VecOp.cu:1632
void eqV(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, const int beginIdA, const int beginIdB, const int n)
Vector assignment, a[i] = b[i], kernel wrapper (cudaReal).
Definition VecOp.cu:1020
void subVS(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, cudaReal const c, const int beginIdA, const int beginIdB, const int n)
Vector subtraction, a[i] = b[i] - c, kernel wrapper (cudaReal).
Definition VecOp.cu:1304
void addVV(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, DeviceArray< cudaReal > const &c, const int beginIdA, const int beginIdB, const int beginIdC, const int n)
Vector addition, a[i] = b[i] + c[i], kernel wrapper (cudaReal).
Definition VecOp.cu:1084
void subVV(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, DeviceArray< cudaReal > const &c, const int beginIdA, const int beginIdB, const int beginIdC, const int n)
Vector subtraction, a[i] = b[i] - c[i], kernel wrapper (cudaReal).
Definition VecOp.cu:1228
void divEqVc(DeviceArray< cudaComplex > &a, DeviceArray< cudaReal > const &b, cudaReal const c)
Vector division in-place w/ coeff., a[i] /= (b[i] * c), kernel wrapper.
Definition VecOpMisc.cu:377
void addEqVc(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, cudaReal const c)
Vector addition in-place w/ coefficient, a[i] += b[i] * c, kernel wrapper.
Definition VecOpMisc.cu:343
PSCF package top-level namespace.
Definition param_pc.dox:1
Utility classes for scientific computation.