1#ifndef RPG_LR_AM_COMPRESSOR_TPP
2#define RPG_LR_AM_COMPRESSOR_TPP
11#include "LrAmPreCompressor.h"
12#include <rpg/System.h>
13#include <rpg/fts/compressor/intra/IntraCorrelation.h>
14#include <prdc/crystal/shiftToMinimum.h>
15#include <prdc/cuda/resources.h>
16#include <pscf/chem/Monomer.h>
17#include <pscf/mesh/MeshIterator.h>
32 { setClassName(
"LrAmPreCompressor"); }
52 const int nMonomer = system().mixture().nMonomer();
53 const int meshSize = system().domain().mesh().size();
54 IntVec<D> const & dimensions = system().mesh().dimensions();
61 for (
int i = 0; i < D; ++i) {
63 kMeshDimensions_[i] = dimensions[i];
65 kMeshDimensions_[i] = dimensions[i]/2 + 1;
71 for (
int i = 0; i < D; ++i) {
72 kSize_ *= kMeshDimensions_[i];
77 w0_.allocate(nMonomer);
78 wFieldTmp_.allocate(nMonomer);
79 error_.allocate(dimensions);
80 resid_.allocate(dimensions);
81 residK_.allocate(dimensions);
82 intraCorrelation_.allocate(kMeshDimensions_);
83 for (
int i = 0; i < nMonomer; ++i) {
84 w0_[i].allocate(dimensions);
85 wFieldTmp_[i].allocate(dimensions);
91 for (
int i = 0; i < nMonomer; ++i) {
96 intraCorrelation_ = intra_.computeIntraCorrelations();
129 double LrAmPreCompressor<D>::maxAbs(DeviceArray<cudaReal>
const & a)
137 LrAmPreCompressor<D>::updateBasis(
RingBuffer< DeviceArray<cudaReal> > & basis,
138 RingBuffer< DeviceArray<cudaReal> >
const & hists)
144 if (basis[0].isAllocated()) {
145 UTIL_CHECK(basis[0].capacity() == hists[0].capacity());
147 basis[0].allocate(hists[0].capacity());
155 LrAmPreCompressor<D>::addHistories(DeviceArray<cudaReal>& trial,
156 RingBuffer<DeviceArray<cudaReal> >
const & basis,
160 for (
int i = 0; i < nHist; i++) {
167 LrAmPreCompressor<D>::addPredictedError(DeviceArray<cudaReal>& fieldTrial,
168 DeviceArray<cudaReal>
const & resTrial,
// Returns the value of system().w().hasData(), i.e. whether the parent
// system's w container currently reports holding data.
// NOTE(review): presumably queried by the Anderson-mixing base algorithm to
// decide whether iteration can start from the current fields -- confirm
// against the caller, which is not visible in this listing.
176 bool LrAmPreCompressor<D>::hasInitialGuess()
177 {
return system().w().hasData(); }
// Returns the length of the vectors handled by this compressor, taken as
// system().domain().mesh().size() (the same quantity the setup code in this
// file stores as `meshSize`).
// computeError() uses this value as `n` when converting the residual norm
// to an RMS value (normRes/sqrt(n)).
181 int LrAmPreCompressor<D>::nElements()
182 {
return system().domain().mesh().size(); }
186 void LrAmPreCompressor<D>::getCurrent(DeviceArray<cudaReal>& curr)
199 void LrAmPreCompressor<D>::evaluate()
207 void LrAmPreCompressor<D>::getResidual(DeviceArray<cudaReal>& resid)
209 const int nMonomer = system().mixture().nMonomer();
210 const double vMonomer = system().mixture().vMonomer();
214 for (
int i = 1; i < nMonomer; i++) {
219 system().fft().forwardTransform(resid_, residK_);
225 system().fft().inverseTransformUnsafe(residK_, resid_);
234 void LrAmPreCompressor<D>::update(DeviceArray<cudaReal>& newGuess)
237 const int nMonomer = system().mixture().nMonomer();
240 for (
int i = 0; i < nMonomer; i++) {
245 system().setWRGrid(wFieldTmp_);
249 void LrAmPreCompressor<D>::outputToLog()
257 out <<
"Compressor times contributions:\n";
278 std::string errorType,
282 const int n = nElements();
283 const int nMonomer = system().mixture().nMonomer();
287 for (
int i = 1; i < nMonomer; i++) {
292 double maxRes = maxAbs(error_);
299 double rmsRes = normRes/sqrt(n);
302 Log::file() <<
"Max Residual = " <<
Dbl(maxRes,15) <<
"\n";
303 Log::file() <<
"Residual Norm = " <<
Dbl(normRes,15) <<
"\n";
311 if (errorType ==
"maxResid") {
313 }
else if (errorType ==
"normResid") {
315 }
else if (errorType ==
"rmsResid") {
318 UTIL_THROW(
"Invalid iterator error type in parameter file.");
323 if (errorType ==
"maxResid") {
325 }
else if (errorType ==
"normResid") {
327 }
else if (errorType ==
"rmsResid") {
328 error = normRes/sqrt(n);
330 UTIL_THROW(
"Invalid iterator error type in parameter file.");
Template for Anderson mixing iterator algorithm.
Dynamic array on the GPU device with aligned data.
int capacity() const
Return allocated capacity.
An IntVec<D, T> is a D-component vector of elements of integer type T.
Base class for iterators that impose incompressibility.
Anderson Mixing compressor with linear-response preconditioning.
LrAmPreCompressor(System< D > &system)
Constructor.
double computeError(DeviceArray< cudaReal > &residTrial, DeviceArray< cudaReal > &fieldTrial, std::string errorType, int verbose)
Compute and return error used to test for convergence.
void readParameters(std::istream &in)
Read all parameters and initialize.
void setup(bool isContinuation)
Initialize just before entry to iterative loop.
void clearTimers()
Reset / clear all timers.
int compress()
Compress to obtain partial saddle point w+.
void outputTimers(std::ostream &out)
Write a report of time contributions used by this algorithm.
~LrAmPreCompressor()
Destructor.
Main class for calculations that represent one system.
Dynamically allocatable contiguous array template.
Wrapper for a double precision number, for formatted ostream output.
static std::ostream & file()
Get log ostream by reference.
Class for storing history of previous values in an array.
File containing preprocessor macros for error handling.
#define UTIL_CHECK(condition)
Assertion macro suitable for serial or parallel production code.
#define UTIL_THROW(msg)
Macro for throwing an Exception, reporting function, file and line number.
cudaReal innerProduct(DeviceArray< cudaReal > const &a, DeviceArray< cudaReal > const &b)
Compute inner product of two real arrays (GPU kernel wrapper).
cudaReal maxAbs(DeviceArray< cudaReal > const &in)
Get maximum absolute magnitude of array elements (GPU kernel wrapper).
void addEqV(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, const int beginIdA, const int beginIdB, const int n)
Vector addition in-place, a[i] += b[i], kernel wrapper (cudaReal).
void eqV(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, const int beginIdA, const int beginIdB, const int n)
Vector assignment, a[i] = b[i], kernel wrapper (cudaReal).
void subVS(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, cudaReal const c, const int beginIdA, const int beginIdB, const int n)
Vector subtraction, a[i] = b[i] - c, kernel wrapper (cudaReal).
void addVV(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, DeviceArray< cudaReal > const &c, const int beginIdA, const int beginIdB, const int beginIdC, const int n)
Vector addition, a[i] = b[i] + c[i], kernel wrapper (cudaReal).
void subVV(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, DeviceArray< cudaReal > const &c, const int beginIdA, const int beginIdB, const int beginIdC, const int n)
Vector subtraction, a[i] = b[i] - c[i], kernel wrapper (cudaReal).
void divEqVc(DeviceArray< cudaComplex > &a, DeviceArray< cudaReal > const &b, cudaReal const c)
Vector division in-place w/ coeff., a[i] /= (b[i] * c), kernel wrapper.
void addEqVc(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, cudaReal const c)
Vector addition in-place w/ coefficient, a[i] += b[i] * c, kernel wrapper.
PSCF package top-level namespace.
Utility classes for scientific computation.