1.0.0/Pulay_8h_source.html

 /*-------------------------------------------------------------------
 Copyright 2015 Ravishankar Sundararaman

 This file is part of JDFTx.

 JDFTx is free software: you can redistribute it and/or modify
 it under the terms of the GNU General Public License as published by
 the Free Software Foundation, either version 3 of the License, or
 (at your option) any later version.

 JDFTx is distributed in the hope that it will be useful,
 but WITHOUT ANY WARRANTY; without even the implied warranty of
 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 GNU General Public License for more details.

 You should have received a copy of the GNU General Public License
 along with JDFTx.  If not, see <http://www.gnu.org/licenses/>.
 -------------------------------------------------------------------*/

 #ifndef JDFTX_CORE_PULAY_H
 #define JDFTX_CORE_PULAY_H

 #include <core/PulayParams.h>
 #include <core/Util.h>
 #include <electronic/matrix.h>
 #include <cfloat>

 //! Pulay mixing for self-consistent field optimization.
 //! Derived classes choose the mixed Variable type and implement the pure virtual interface below.
 template<typename Variable> class Pulay
 {
 public:
         //! Construct with the given parameters.
         //! Only a reference to pp is stored, so pp must outlive this object.
         Pulay(const PulayParams& pp);

         //! Virtual destructor: this class is a polymorphic base (it declares pure virtual functions),
         //! so destroying a derived object through a Pulay pointer must be well-defined.
         virtual ~Pulay() {}

         //! Minimize energy using a self-consistent iteration.
         //! @param Eprev Initial value of the minimized quantity
         //! @param extraNames Labels of additional convergence quantities (used in the log output)
         //! @param extraThresh Convergence thresholds for the additional quantities (same length as extraNames)
         //! @return Value of the minimized quantity after the last cycle
         double minimize(double Eprev=+DBL_MAX, std::vector<string> extraNames=std::vector<string>(), std::vector<double> extraThresh=std::vector<double>());

         void loadState(const char* filename); //!< Load the state from a single binary file
         void saveState(const char* filename) const; //!< Save the state to a single binary file

         //! Override to synchronize scalars over MPI processes; the default returns x unchanged.
         virtual double sync(double x) const { return x; }

 protected:
         //----- Interface specification -----

         //! Single cycle of the self-consistency loop.
         //! @param dEprev Change in the minimized quantity over the previous cycle
         //! @param extraValues Filled with the current values of the additional convergence quantities
         //! @return New value of the minimized quantity
         virtual double cycle(double dEprev, std::vector<double>& extraValues)=0;

         virtual void report(int iter) {} //!< Override to perform optional reporting
         virtual void axpy(double alpha, const Variable& X, Variable& Y) const=0; //!< Scaled accumulate on variable
         virtual double dot(const Variable& X, const Variable& Y) const=0; //!< Euclidean dot product. Metric applied separately for efficiency.
         virtual size_t variableSize() const=0; //!< Number of bytes per variable
         virtual void readVariable(Variable&, FILE*) const=0; //!< Read variable from stream
         virtual void writeVariable(const Variable&, FILE*) const=0; //!< Write variable to stream
         virtual Variable getVariable() const=0; //!< Get the current state of the system as a variable
         virtual void setVariable(const Variable&)=0; //!< Set the state of system to specified variable
         virtual Variable precondition(const Variable&) const=0; //!< Apply preconditioner to variable/residual
         virtual Variable applyMetric(const Variable&) const=0; //!< Apply metric to variable/residual

 private:
         const PulayParams& pp; //!< Parameters controlling the mixing (held by reference, not copied)
         std::vector<Variable> pastVariables; //!< Cached variables from previous cycles (oldest first)
         std::vector<Variable> pastResiduals; //!< Cached residuals matching pastVariables entry by entry
         matrix overlap; //!< Overlaps of past residuals (with the metric applied), constructed as pp.history x pp.history
 };


 //---------------------- Implementation ----------------------------

 #include <core/Minimize_linmin.h>
 #include <memory>

 //Convergence test on a norm (eigenvalue-difference or residual):
 //reports success only once the norm has been below the threshold
 //(in magnitude) for nCheck cycles in a row.
 class NormCheck
 {
 public:
         //nCheck: number of consecutive cycles required; threshold: tolerance (its sign is ignored)
         NormCheck(unsigned nCheck, double threshold)
         : nCheck(nCheck), threshold(fabs(threshold))
         {
         }

         //Record the outcome for this cycle and return true if the
         //latest nCheck recorded outcomes are all within tolerance
         bool checkConvergence(double norm)
         {       const bool withinTolerance = (fabs(norm) < threshold);
                 history.push_back(withinTolerance);
                 if(history.size() == nCheck+1)
                         history.pop_front(); //keep at most nCheck outcomes
                 if(history.size() != nCheck)
                         return false; //not enough cycles recorded yet
                 for(std::deque<bool>::const_iterator it = history.begin(); it != history.end(); ++it)
                 {       if(!(*it))
                                 return false;
                 }
                 return true;
         }

 private:
         unsigned nCheck; //number of consecutive cycles that must satisfy the tolerance
         double threshold; //non-negative tolerance on |norm|
         std::deque<bool> history; //outcomes of the most recent cycles, oldest first
 };

 //Set up Pulay mixing: keep a reference to the parameters (pp must outlive this object)
 //and construct the residual overlap matrix with dimensions (pp.history, pp.history).
 template<typename Variable>
 Pulay<Variable>::Pulay(const PulayParams& pp)
         : pp(pp),
           overlap(pp.history, pp.history)
 {}

 //Run the self-consistent iteration with Pulay (DIIS) mixing for at most pp.nIterations cycles.
 //  Eprev:       initial value of the minimized quantity (passed through sync() before use)
 //  extraNames:  labels of additional convergence quantities, used only in the log output
 //  extraThresh: thresholds for those quantities; must have the same length as extraNames
 //Returns the value of the minimized quantity from the last completed cycle
 //(or the synced initial value if the loop body never runs).
 //The loop ends early on the first satisfied convergence check or when killFlag is set.
 template<typename Variable> double Pulay<Variable>::minimize(double Eprev, std::vector<string> extraNames, std::vector<double> extraThresh)
 {
         //Eprev is reset to zero here, so the first dE handed to cycle() equals the synced initial value itself
         double E = sync(Eprev); Eprev = 0.;
         double dE = E-Eprev;
         assert(extraNames.size()==extraThresh.size());

         //Initialize convergence checkers:
         //(EdiffCheck is declared in Minimize_linmin.h; presumably it tests successive energy differences - TODO confirm)
         EdiffCheck ediffCheck(2, pp.energyDiffThreshold); ediffCheck.checkConvergence(E); //store the initial energy in the check's history
         NormCheck resCheck(2, pp.residualThreshold); //residual must be below threshold for 2 consecutive cycles
         std::vector<std::shared_ptr<NormCheck> > extraCheck(extraNames.size()); //one independent checker per extra quantity
         for(size_t iExtra=0; iExtra<extraNames.size(); iExtra++)
                 extraCheck[iExtra] = std::make_shared<NormCheck>(2, extraThresh[iExtra]);

         for(int iter=0; iter<pp.nIterations; iter++)
         {
                 //If history is full, remove oldest member
                 assert(pastResiduals.size() == pastVariables.size());
                 if((int)pastResiduals.size() >= pp.history)
                 {       size_t ndim = pastResiduals.size();
                         //Move the overlaps of the retained entries up by one row and column
                         //(assumes the range arguments are half-open index intervals - TODO confirm against matrix)
                         if(ndim>1) overlap.set(0,ndim-1, 0,ndim-1, overlap(1,ndim, 1,ndim));
                         pastVariables.erase(pastVariables.begin());
                         pastResiduals.erase(pastResiduals.begin());
                 }

                 //Cache the old energy and variables
                 Eprev = E;
                 pastVariables.push_back(getVariable());

                 //Perform cycle:
                 std::vector<double> extraValues(extraThresh.size()); //filled in by cycle()
                 E = sync(cycle(dE, extraValues));
                 dE = E - Eprev;
                 for(auto& v: extraValues) v = sync(v);

                 //Calculate and cache residual:
                 //(variable after the cycle with -1 times the variable before it accumulated via axpy)
                 double residualNorm = 0.;
                 {       Variable residual = getVariable(); axpy(-1., pastVariables.back(), residual);
                         pastResiduals.push_back(residual);
                         residualNorm = sync(sqrt(dot(residual,residual)));
                 }

                 //Print energy and convergence parameters:
                 fprintf(pp.fpLog, "%sCycle: %2i   %s: ", pp.linePrefix, iter, pp.energyLabel);
                 fprintf(pp.fpLog, pp.energyFormat, E);
                 fprintf(pp.fpLog, "   d%s: %+.3e", pp.energyLabel, dE);
                 fprintf(pp.fpLog, "   |Residual|: %.3e", residualNorm);
                 for(size_t iExtra=0; iExtra<extraNames.size(); iExtra++)
                         fprintf(pp.fpLog, "   |%s|: %.3e", extraNames[iExtra].c_str(), extraValues[iExtra]);
                 fprintf(pp.fpLog, "\n"); fflush(pp.fpLog);

                 //Optional reporting:
                 report(iter);

                 //Check for convergence and update variable:
                 //(checks run in order and stop at the first success, so later checkers
                 // do not record this cycle once an earlier one has reported convergence)
                 bool converged = false;
                 if(!converged && ediffCheck.checkConvergence(E))
                 {       fprintf(pp.fpLog, "%sConverged (|Delta E|<%le for 2 iters).\n\n", pp.linePrefix, pp.energyDiffThreshold);
                         converged = true;
                 }
                 if(!converged && resCheck.checkConvergence(residualNorm))
                 {       fprintf(pp.fpLog, "%sConverged (|Residual|<%le for 2 iters).\n\n", pp.linePrefix, pp.residualThreshold);
                         converged = true;
                 }
                 if(!converged && extraNames.size())
                         for(size_t iExtra=0; iExtra<extraNames.size(); iExtra++)
                                 if(extraCheck[iExtra]->checkConvergence(extraValues[iExtra]))
                                 {       fprintf(pp.fpLog, "%sConverged (|%s|<%le for 2 iters).\n\n", pp.linePrefix, extraNames[iExtra].c_str(), extraThresh[iExtra]);
                                         converged = true;
                                         break;
                                 }
                 fflush(pp.fpLog);
                 if(converged || killFlag) break; //converged or manually interrupted

                 //---- DIIS/Pulay mixing -----

                 //Update the overlap matrix
                 //(only the last row and column change: overlaps of every cached residual with the newest one)
                 size_t ndim = pastResiduals.size();
                 Variable MlastResidual = applyMetric(pastResiduals.back());
                 for(size_t j=0; j<ndim; j++)
                 {       double thisOverlap = dot(pastResiduals[j], MlastResidual);
                         overlap.set(j, ndim-1, thisOverlap);
                         overlap.set(ndim-1, j, thisOverlap);
                 }

                 //Invert the residual overlap matrix to get the minimum of residual
                 matrix cOverlap(ndim+1, ndim+1); //Add row and column to enforce normalization constraint
                 cOverlap.set(0, ndim, 0, ndim, overlap(0, ndim, 0, ndim));
                 for(size_t j=0; j<ndim; j++)
                 {       cOverlap.set(j, ndim, 1);
                         cOverlap.set(ndim, j, 1);
                 }
                 cOverlap.set(ndim, ndim, 0);
                 matrix cOverlap_inv = inv(cOverlap);

                 //Update variable:
                 //(mixing coefficients are the real parts of entries (j, ndim) of the inverse;
                 // v starts default-constructed, so axpy presumably must accept that as an empty accumulator - TODO confirm)
                 complex* coefs = cOverlap_inv.data();
                 Variable v;
                 for(size_t j=0; j<ndim; j++)
                 {       double alpha = coefs[cOverlap_inv.index(j, ndim)].real();
                         axpy(alpha, pastVariables[j], v);
                         axpy(alpha, precondition(pastResiduals[j]), v);
                 }
                 setVariable(v);
         }
         return E;
 }

 //Load the Pulay history (past variables and residuals) from a single binary file,
 //keeping only the most recent pp.history entries, and recompute their overlaps.
 //The file is read as consecutive (variable, residual) pairs, oldest first.
 //Terminates via die() if the file cannot be examined or opened, or if its size is
 //not a whole number of (variable, residual) pairs.
 template<typename Variable> void Pulay<Variable>::loadState(const char* filename)
 {
         const size_t nBytesCycle = 2 * variableSize(); //number of bytes per history entry (one variable + one residual)
         if(!nBytesCycle) //guard the division / modulus below
                 die("Cannot read Pulay history file '%s': mixed variable has zero size.\n", filename);

         //Validate the file size before deriving any counts from it:
         const auto fileBytes = fileSize(filename);
         if(fileBytes < 0) //a negative size presumably means the file could not be examined (TODO confirm against fileSize)
                 die("Could not determine the size of Pulay history file '%s'.\n", filename);
         const size_t nBytesFile = size_t(fileBytes);
         if(nBytesFile % nBytesCycle != 0)
                 die("Pulay history file '%s' does not contain an integral multiple of the mixed variables and residuals.\n", filename);

         //Keep only the newest entries if the file holds more than the history length:
         size_t ndim = nBytesFile / nBytesCycle;
         size_t dimOffset = 0; //number of leading (oldest) entries to skip
         const size_t maxDim = (pp.history > 0) ? size_t(pp.history) : 0;
         if(ndim > maxDim)
         {       dimOffset = ndim - maxDim;
                 ndim = maxDim;
         }

         fprintf(pp.fpLog, "%sReading %lu past variables and residuals from '%s' ... ", pp.linePrefix, static_cast<unsigned long>(ndim), filename); logFlush();
         pastVariables.resize(ndim);
         pastResiduals.resize(ndim);
         FILE* fp = fopen(filename, "rb"); //binary mode: the file holds raw variable data
         if(!fp)
                 die("Could not open Pulay history file '%s' for reading.\n", filename);
         if(dimOffset && fseek(fp, long(dimOffset*nBytesCycle), SEEK_SET) != 0)
                 die("Could not seek within Pulay history file '%s'.\n", filename);
         for(size_t idim=0; idim<ndim; idim++)
         {       readVariable(pastVariables[idim], fp);
                 readVariable(pastResiduals[idim], fp);
         }
         fclose(fp);
         fprintf(pp.fpLog, "done.\n"); fflush(pp.fpLog);

         //Compute overlaps of loaded history (symmetric, so fill both triangles from one dot product):
         for(size_t i=0; i<ndim; i++)
         {       Variable Mresidual_i = applyMetric(pastResiduals[i]);
                 for(size_t j=0; j<=i; j++)
                 {       double thisOverlap = dot(pastResiduals[j], Mresidual_i);
                         overlap.set(i,j, thisOverlap);
                         overlap.set(j,i, thisOverlap);
                 }
         }
 }

 //Save the Pulay history to a single binary file as consecutive (variable, residual)
 //pairs, oldest first (the order in which loadState reads them back).
 //Only the head process writes; all other processes return immediately.
 //If the file cannot be opened, a warning is logged and nothing is written.
 template<typename Variable> void Pulay<Variable>::saveState(const char* filename) const
 {
         if(!mpiUtil->isHead()) return;

         FILE* fp = fopen(filename, "wb"); //binary mode: the file holds raw variable data
         if(!fp)
         {       //die() is documented as needing to be called from all processes, but only the
                 //head process reaches this point, so report the failure and carry on instead.
                 fprintf(pp.fpLog, "%sWARNING: could not open '%s' for writing; Pulay history not saved.\n", pp.linePrefix, filename);
                 fflush(pp.fpLog);
                 return;
         }
         for(size_t idim=0; idim<pastVariables.size(); idim++)
         {       writeVariable(pastVariables[idim], fp);
                 writeVariable(pastResiduals[idim], fp);
         }
         fclose(fp);
 }


 #endif //JDFTX_CORE_PULAY_H
Pulay
Pulay mixing for self-consistent field optimization.
Definition: Pulay.h:35

EdiffCheck
Definition: Minimize_linmin.h:27

sqrt
ScalarField sqrt(const ScalarField &)
Elementwise square root (preserve input)

Pulay::applyMetric
virtual Variable applyMetric(const Variable &) const =0
Apply metric to variable/residual.

PulayParams::energyDiffThreshold
double energyDiffThreshold
convergence threshold for energy difference between successive iterations
Definition: PulayParams.h:34

matrix
General complex matrix.
Definition: matrix.h:57

logFlush
#define logFlush()
fflush() for log files
Definition: Util.h:115

Pulay::dot
virtual double dot(const Variable &X, const Variable &Y) const =0
Euclidean dot product. Metric applied separately for efficiency.

PulayParams::nIterations
int nIterations
maximum iterations (single point calculation if 0)
Definition: PulayParams.h:33

MPIUtil::isHead
bool isHead() const
whether this is the root process (makes code more readable)
Definition: MPIUtil.h:39

PulayParams::linePrefix
const char * linePrefix
prefix for each output line of Pulay (default "Pulay: ")
Definition: PulayParams.h:29

matrix::index
int index(int i, int j) const
Index into data()
Definition: matrix.h:65

matrix::set
void set(int i, int j, complex m)
set element to m

fileSize
off_t fileSize(const char *filename)
Get the size of a file.

Pulay::precondition
virtual Variable precondition(const Variable &) const =0
Apply preconditioner to variable/residual.

Pulay::setVariable
virtual void setVariable(const Variable &)=0
Set the state of system to specified variable.

Pulay::readVariable
virtual void readVariable(Variable &, FILE *) const =0
Read variable from stream.

PulayParams
Parameters to control Pulay mixing.
Definition: PulayParams.h:26

Pulay::report
virtual void report(int iter)
Override to perform optional reporting.
Definition: Pulay.h:66

PulayParams::energyFormat
const char * energyFormat
printf format for the minimized quantity (default "%22.15le")
Definition: PulayParams.h:31

killFlag
bool killFlag
Flag set by signal handlers - all compute loops should quit cleanly when this is set.

PulayParams::fpLog
FILE * fpLog
Stream to log iterations to.
Definition: PulayParams.h:28

PulayParams::residualThreshold
double residualThreshold
convergence threshold on the residual
Definition: PulayParams.h:35

Pulay::loadState
void loadState(const char *filename)
Load the state from a single binary file.

die
#define die(...)
Quit with an error message (formatted using printf()). Must be called from all processes.
Definition: Util.h:118

Util.h
Miscellaneous utilities.

inv
ScalarField inv(const ScalarField &)
Elementwise reciprocal (preserve input)

Pulay::saveState
void saveState(const char *filename) const
Save the state to a single binary file.

Pulay::getVariable
virtual Variable getVariable() const =0
Get the current state of the system as a variable.

Pulay::cycle
virtual double cycle(double dEprev, std::vector< double > &extraValues)=0
Single cycle of the self-consistency loop. In each subsequent cycle, Pulay will try to zero the diffe...

PulayParams::history
int history
Number of past residuals and vectors that are cached and used for mixing.
Definition: PulayParams.h:37

ManagedMemory::data
complex * data()
Return a pointer to the actual data. Returns a CPU pointer to the actual data; will move data from GPU ...

Pulay::sync
virtual double sync(double x) const
Override to synchronize scalars over MPI processes (if the same minimization is happening in sync ove...
Definition: Pulay.h:51

complex
Complex number (need to define our own because we need operators for gpu code as well) ...
Definition: scalar.h:49

Pulay::minimize
double minimize(double Eprev=+DBL_MAX, std::vector< string > extraNames=std::vector< string >(), std::vector< double > extraThresh=std::vector< double >())
Minimize energy using a self-consistent iteration.

PulayParams::energyLabel
const char * energyLabel
Label for the minimized quantity (default "E")
Definition: PulayParams.h:30

Pulay::axpy
virtual void axpy(double alpha, const Variable &X, Variable &Y) const =0
Scaled accumulate on variable.

Pulay::variableSize
virtual size_t variableSize() const =0
Number of bytes per variable.

assert
#define assert(expr)
A custom assertion with stack trace (NOTE: enabled in release modes as well)
Definition: Util.h:104