1#ifndef PRDC_VEC_OP_MISC_H
2#define PRDC_VEC_OP_MISC_H
12#include <pscf/cuda/DeviceArray.h>
13#include <util/containers/DArray.h>
70void addVcVc(DeviceArray<cudaReal>& a,
71 DeviceArray<cudaReal>
const & b, cudaReal
const c,
72 DeviceArray<cudaReal>
const & d, cudaReal
const e);
86 DeviceArray<cudaReal>
const & b, cudaReal
const c,
87 DeviceArray<cudaReal>
const & d, cudaReal
const e,
88 DeviceArray<cudaReal>
const & f, cudaReal
const g);
97void addEqVc(DeviceArray<cudaReal>& a, DeviceArray<cudaReal>
const & b,
108void subVVS(DeviceArray<cudaReal>& a, DeviceArray<cudaReal>
const & b,
109 DeviceArray<cudaReal>
const & c, cudaReal
const d);
118void divEqVc(DeviceArray<cudaComplex>& a, DeviceArray<cudaReal>
const & b,
128void expVc(DeviceArray<cudaReal>& a, DeviceArray<cudaReal>
const & b,
142void eqVPair(DeviceArray<cudaReal>& a1, DeviceArray<cudaReal>& a2,
143 DeviceArray<cudaReal>
const & s);
154void mulVVPair(DeviceArray<cudaReal>& a1, DeviceArray<cudaReal>& a2,
155 DeviceArray<cudaReal>
const & b1,
156 DeviceArray<cudaReal>
const & b2,
157 DeviceArray<cudaReal>
const & s);
166void mulEqVPair(DeviceArray<cudaReal>& a1, DeviceArray<cudaReal>& a2,
167 DeviceArray<cudaReal>
const & s);
183void addVMany(DeviceArray<cudaReal>& a,
184 DArray<DeviceArray<cudaReal> >
const & vecs);
201void addVMany(DeviceArray<cudaReal>& a,
202 DArray<DeviceArray<cudaReal>
const *>
const & vecs);
214void mulVMany(DeviceArray<cudaReal>& a,
215 DArray<DeviceArray<cudaReal> >
const & vecs);
232void mulVMany(DeviceArray<cudaReal>& a,
233 DArray<DeviceArray<cudaReal>
const *>
const & vecs);
245void sqNormV(DeviceArray<cudaReal>& a, DeviceArray<cudaComplex>
const & b);
253void sqSqNormV(DeviceArray<cudaReal>& a, DeviceArray<cudaComplex>
const & b);
void addVMany(DeviceArray< cudaReal > &a, DArray< DeviceArray< cudaReal > > const &vecs)
Add an undefined number of vectors pointwise, kernel wrapper.
void addVcVcVc(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, cudaReal const c, DeviceArray< cudaReal > const &d, cudaReal const e, DeviceArray< cudaReal > const &f, cudaReal const g)
3-vec addition w coeff, a[i] = (b[i]*c) + (d[i]*e) + (f[i]*g), kernel wrapper.
void expVc(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, cudaReal const c)
Vector exponentiation w/ coefficient, a[i] = exp(b[i]*c), kernel wrapper.
void sqSqNormV(DeviceArray< cudaReal > &a, DeviceArray< cudaComplex > const &b)
Norm of complex number to the 4th power, a[i] = norm(b[i])^4, kernel wrapper.
void mulVVPair(DeviceArray< cudaReal > &a1, DeviceArray< cudaReal > &a2, DeviceArray< cudaReal > const &b1, DeviceArray< cudaReal > const &b2, DeviceArray< cudaReal > const &s)
Vector multiplication in pairs, ax[i] = bx[i] * s[i], kernel wrapper.
void addVcVc(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, cudaReal const c, DeviceArray< cudaReal > const &d, cudaReal const e)
Vector addition w/ coefficient, a[i] = (b[i]*c) + (d[i]*e), kernel wrapper.
void mulVMany(DeviceArray< cudaReal > &a, DArray< DeviceArray< cudaReal > > const &vecs)
Multiply an undefined number of vectors pointwise, kernel wrapper.
void subVVS(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, DeviceArray< cudaReal > const &c, cudaReal const d)
Vector subtraction, a[i] = b[i] - c[i] - d, kernel wrapper.
void eqVPair(DeviceArray< cudaReal > &a1, DeviceArray< cudaReal > &a2, DeviceArray< cudaReal > const &s)
Vector assignment in pairs, ax[i] = b[i], kernel wrapper.
void sqNormV(DeviceArray< cudaReal > &a, DeviceArray< cudaComplex > const &b)
Squared norm of complex number, a[i] = norm(b[i])^2, kernel wrapper.
void divEqVc(DeviceArray< cudaComplex > &a, DeviceArray< cudaReal > const &b, cudaReal const c)
Vector division in-place w/ coeff., a[i] /= (b[i] * c), kernel wrapper.
void mulEqVPair(DeviceArray< cudaReal > &a1, DeviceArray< cudaReal > &a2, DeviceArray< cudaReal > const &s)
In-place vector multiplication in pairs, ax[i] *= s[i], kernel wrapper.
void addEqVc(DeviceArray< cudaReal > &a, DeviceArray< cudaReal > const &b, cudaReal const c)
Vector addition in-place w/ coefficient, a[i] += b[i] * c, kernel wrapper.
PSCF package top-level namespace.