madness/solver_8h_source.html

 /*

   This file is part of MADNESS.


   Copyright (C) 2007,2010 Oak Ridge National Laboratory


   This program is free software; you can redistribute it and/or modify

   it under the terms of the GNU General Public License as published by

   the Free Software Foundation; either version 2 of the License, or

   (at your option) any later version.


   This program is distributed in the hope that it will be useful,

   but WITHOUT ANY WARRANTY; without even the implied warranty of

   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

   GNU General Public License for more details.


   You should have received a copy of the GNU General Public License

   along with this program; if not, write to the Free Software

   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA


   For more information please contact:


   Robert J. Harrison

   Oak Ridge National Laboratory

   One Bethel Valley Road

   P.O. Box 2008, MS-6367


   email: harrisonrj@ornl.gov

   tel:   865-241-3937

   fax:   865-572-0680


   $Id$

 */

 #include <madness/mra/mra.h>

 //#include <madness/mra/lbdeux.h>

 #include <madness/world/world.h>

 #include <madness/tensor/solvers.h>

 #include <vector>

 #include <madness/fortran_ctypes.h>

 #include <cmath>


 #include "poperator.h"

 #include "libxc.h"

 #include "electronicstructureparams.h"

 #include "complexfun.h"

 #include "esolver.h"


 #ifndef SOLVER_H_


 using std::endl;

 using std::setfill;

 using std::setw;

 using std::ostream;


 //*****************************************************************************

 /* static double onesfunc(const coordT& x) */

 /* { */

 /*   return 1.0; */

 /* } */

 //*****************************************************************************


 namespace madness

 {

   //***************************************************************************

   template <typename T>

   T stheta_fd(const T& x)

   {

     if (x > 50.0)

     {

       return 1.0;

     }

     else if (x < -50.0)

     {

       return 0.0;

     }

     else

     {

       return 1.0/(1.0 + exp(-x));

     }

   }

   //***************************************************************************


   // NOTE: so this is totally hacked because of the requirement of using a box

   //       of L*L*L rather than the convention of using a combination of

   //       lattice vectors and reciprocal lattice vectors (FOR NOW)

   // On second thought, it might be ok for general use if used "right".

   //***************************************************************************

   template <std::size_t NDIM>

   class ComplexExp : public FunctionFunctorInterface<double_complex,NDIM> {

   public:

       typedef Vector<double,NDIM> coordT;

       typedef Vector<double,NDIM> vec3dT;

       const double_complex coeff;

       const vec3dT exponent;


       ComplexExp(vec3dT exponent, double_complex coeff)

               : exponent(exponent), coeff(coeff) {}


       double_complex operator()(const coordT& x) const {

           double sum = 0.0;

           for (std::size_t i=0; i<NDIM; ++i) {

               sum += x[i]*exponent[i];

           };

           return coeff*exp(double_complex(0.0,sum));

       }

   };

   //***************************************************************************


   //***************************************************************************

   class WSTAtomicBasisFunctor : public FunctionFunctorInterface<double_complex,3> {

   private:

       const AtomicBasisFunction aofunc;

       double L;

       double kx, ky, kz;


       std::vector<coord_3d> specialpt;

   public:

       WSTAtomicBasisFunctor(const AtomicBasisFunction& aofunc, double L, double kx, double ky, double kz)

           : aofunc(aofunc), L(L), kx(kx), ky(ky), kz(kz)

       {

         double x, y, z;

           aofunc.get_coords(x,y,z);

           coord_3d r;

           r[0]=x; r[1]=y; r[2]=z;

           specialpt=std::vector<coord_3d>(1,r);

       }


       ~WSTAtomicBasisFunctor() {}


       double_complex operator()(const coord_3d& x) const {

           double_complex sum = 0.0;

           const int R = 1;

           const double_complex I = double_complex(0.0,1.0);

           for (int i=-R; i<=+R; i++) {

               double xx = x[0]+i*L;

               for (int j=-R; j<=+R; j++) {

                   double yy = x[1]+j*L;

                   for (int k=-R; k<=+R; k++) {

                       double zz = x[2]+k*L;

                       sum += -exp(-I*(kx*xx+ky*yy+kz*zz+constants::pi/2))*aofunc(xx, yy, zz);

                       //print(kx,ky,kz,exp(-I*(kx*xx+ky*yy+kz*zz+constants::pi/2)),aofunc(xx, yy, zz));

                   }

               }

           }

           return sum;

       }


       std::vector<coord_3d> special_points() const {return specialpt;}

   };

   //***************************************************************************


   //***************************************************************************

   class DipoleFunctor : public FunctionFunctorInterface<double,3> {

   private:

       const int axis;

   public:

       DipoleFunctor(int axis) : axis(axis) {}

       double operator()(const coordT& x) const {

           return x[axis];

       }

       virtual ~DipoleFunctor() {}

   };

   //***************************************************************************


   //***************************************************************************

   template <typename T, int NDIM>

   class SubspaceK

   {

     // Typedef's

     typedef std::complex<T> valueT;

     typedef Function<valueT,NDIM> functionT;

     typedef std::vector<functionT> vecfuncT;

     typedef std::pair<vecfuncT,vecfuncT> pairvecfuncT;

     typedef std::vector<pairvecfuncT> subspaceT;

     typedef Tensor<valueT> tensorT;

     typedef std::vector<tensorT> vectensorT;

     typedef std::vector<subspaceT> vecsubspaceT;


     //*************************************************************************

     World& _world;

     //*************************************************************************


     //*************************************************************************

     vectensorT _Q;

     //*************************************************************************


     //*************************************************************************

     vecsubspaceT _subspace;

     //*************************************************************************


     //*************************************************************************

     std::vector<KPoint> _kpoints;

     //*************************************************************************


     //*************************************************************************

     ElectronicStructureParams _params;

     //*************************************************************************


     //*************************************************************************

     double _residual;

     //*************************************************************************


   public:


     //*************************************************************************

     SubspaceK(World& world, const ElectronicStructureParams& params,

             const std::vector<KPoint>& kpoints) : _world(world), _kpoints(kpoints),

             _params(params)

     {

       _residual = 1e6;

       for (unsigned int kp = 0; kp < _kpoints.size(); kp++)

       {

         _Q.push_back(tensorT(1,1));

         _subspace.push_back(subspaceT());

       }

     }

     //*************************************************************************


     //*************************************************************************

     void update_subspace(vecfuncT& awfs_new,

                          vecfuncT& bwfs_new,

                          const vecfuncT& awfs_old,

                          const vecfuncT& bwfs_old)

     {

       // compute residuals (total)

       vecfuncT t_rm = sub(_world, awfs_old, awfs_new);

       if (_params.spinpol)

       {

         vecfuncT br = sub(_world, bwfs_old, bwfs_new);

         t_rm.insert(t_rm.end(), br.begin(), br.end());

       }

       std::vector<double> rnvec = norm2<valueT,NDIM>(_world, t_rm);

       if (_world.rank() == 0)

       {

         double rnorm = 0.0;

         for (unsigned int i = 0; i < rnvec.size(); i++) rnorm += rnvec[i];

         if (_world.rank() == 0) print("residual = ", rnorm);

         _residual = rnorm;

       }

       _world.gop.broadcast(_residual, 0);


       for (unsigned int kp = 0; kp < _kpoints.size(); kp++)

       {

         KPoint kpoint = _kpoints[kp];


         vecfuncT k_phisa(awfs_old.begin() + kpoint.begin, awfs_old.begin() + kpoint.end);

         vecfuncT k_phisb(bwfs_old.begin() + kpoint.begin, bwfs_old.begin() + kpoint.end);

         vecfuncT k_awfs(awfs_new.begin() + kpoint.begin, awfs_new.begin() + kpoint.end);

         vecfuncT k_bwfs(bwfs_new.begin() + kpoint.begin, bwfs_new.begin() + kpoint.end);


         // compute residuals for k-point

         // concatentate up and down spins

         vecfuncT k_rm = sub(_world, k_phisa, k_awfs);

         vecfuncT k_vm(k_phisa);

         if (_params.spinpol)

         {

           vecfuncT k_br = sub(_world, k_phisb, k_bwfs);

           k_rm.insert(k_rm.end(), k_br.begin(), k_br.end());

           k_vm.insert(k_vm.end(), k_phisb.begin(), k_phisb.end());

         }


         // Update subspace and matrix Q

         compress(_world, k_vm, false);

         compress(_world, k_rm, false);

         _world.gop.fence();

         subspaceT k_subspace = _subspace[kp];

         k_subspace.push_back(pairvecfuncT(k_vm,k_rm));


         int m = k_subspace.size();

         tensorT ms(m);

         tensorT sm(m);

         for (int s = 0; s < m; s++)

         {

             const vecfuncT& k_vs = k_subspace[s].first;

             const vecfuncT& k_rs = k_subspace[s].second;

             for (unsigned int i = 0; i < k_vm.size(); i++)

             {

                 ms[s] += k_vm[i].inner_local(k_rs[i]);

                 sm[s] += k_vs[i].inner_local(k_rm[i]);

             }

         }

         _world.gop.sum(ms.ptr(),m);

         _world.gop.sum(sm.ptr(),m);


         tensorT newQ(m,m);

         if (m > 1) newQ(Slice(0,-2),Slice(0,-2)) = _Q[kp];

         newQ(m-1,_) = ms;

         newQ(_,m-1) = sm;


         _Q[kp] = newQ;

         if (_world.rank() == 0) print(_Q[kp]);


         // Solve the subspace equations

         tensorT c;

         if (_world.rank() == 0) {

             double rcond = 1e-12;

             while (1) {

                 c = KAIN(_Q[kp],rcond);

                 if (abs(c[m-1]) < 3.0) {

                     break;

                 }

                 else if (rcond < 0.01) {

                     if (_world.rank() == 0)

                       print("Increasing subspace singular value threshold ", c[m-1], rcond);

                     rcond *= 100;

                 }

                 else {

                     if (_world.rank() == 0)

                       print("Forcing full step due to subspace malfunction");

                     c = 0.0;

                     c[m-1] = 1.0;

                     break;

                 }

             }

         }


         _world.gop.broadcast_serializable(c, 0);

         if (_world.rank() == 0) {

             //print("Subspace matrix");

             //print(Q);

             print("Subspace solution", c);

         }


         // Form linear combination for new solution

         vecfuncT k_phisa_new = zero_functions<valueT,NDIM>(_world, k_phisa.size());

         vecfuncT k_phisb_new = zero_functions<valueT,NDIM>(_world, k_phisb.size());

         compress(_world, k_phisa_new, false);

         compress(_world, k_phisb_new, false);

         _world.gop.fence();

         std::complex<double> one = std::complex<double>(1.0,0.0);

         unsigned int norbitals = awfs_old.size() / _kpoints.size();

         for (unsigned int m = 0; m < k_subspace.size(); m++)

         {

             const vecfuncT& k_vm = k_subspace[m].first;

             const vecfuncT& k_rm = k_subspace[m].second;

             // WSTHORNTON Stopped here!

             const vecfuncT  vma(k_vm.begin(),k_vm.begin() + norbitals);

             const vecfuncT  rma(k_rm.begin(),k_rm.begin() + norbitals);

             const vecfuncT  vmb(k_vm.end() - norbitals, k_vm.end());

             const vecfuncT  rmb(k_rm.end() - norbitals, k_rm.end());


             gaxpy(_world, one, k_phisa_new, c(m), vma, false);

             gaxpy(_world, one, k_phisa_new,-c(m), rma, false);

             gaxpy(_world, one, k_phisb_new, c(m), vmb, false);

             gaxpy(_world, one, k_phisb_new,-c(m), rmb, false);

         }

         _world.gop.fence();


         if (_params.maxsub <= 1) {

             // Clear subspace if it is not being used

             k_subspace.clear();

         }

         else if (k_subspace.size() == _params.maxsub) {

             // Truncate subspace in preparation for next iteration

             k_subspace.erase(k_subspace.begin());

             _Q[kp] = _Q[kp](Slice(1,-1),Slice(1,-1));

         }

         // Save subspace

         _subspace[kp] = k_subspace;


         for (unsigned int wi = kpoint.begin, fi = 0; wi < kpoint.end;

           wi++, fi++)

         {

           awfs_new[wi] = k_phisa_new[fi];

           bwfs_new[wi] = k_phisb_new[fi];

         }

       }

     }

     //*************************************************************************


   };


   //***************************************************************************

   template <typename T, int NDIM>

   class Subspace

   {

     // Typedef's

     typedef std::complex<T> valueT;

     typedef Function<valueT,NDIM> functionT;

     typedef std::vector<functionT> vecfuncT;

     typedef std::pair<vecfuncT,vecfuncT> pairvecfuncT;

     typedef std::vector<pairvecfuncT> subspaceT;

     typedef Tensor<valueT> tensorT;


     //*************************************************************************

     World& _world;

     //*************************************************************************


     //*************************************************************************

     tensorT _Q;

     //*************************************************************************


     //*************************************************************************

     subspaceT _subspace;

     //*************************************************************************


     //*************************************************************************

     std::vector<KPoint> _kpoints;

     //*************************************************************************


     //*************************************************************************

     ElectronicStructureParams _params;

     //*************************************************************************


   public:


     //*************************************************************************

     Subspace(World& world, const ElectronicStructureParams& params)

       : _world(world), _params(params)

     {

     }

     //*************************************************************************


     //*************************************************************************

     void update_subspace(vecfuncT& awfs_new,

                          vecfuncT& bwfs_new,

                          const vecfuncT& awfs_old,

                          const vecfuncT& bwfs_old,

                          const vecfuncT& rm)

     {

       // concatentate up and down spins

       vecfuncT vm = awfs_old;

       if (_params.spinpol)

       {

         vm.insert(vm.end(), bwfs_old.begin(), bwfs_old.end());

       }


       // Update subspace and matrix Q

       compress(_world, vm, false);

       compress(_world, rm, false);

       _world.gop.fence();

       _subspace.push_back(pairvecfuncT(vm,rm));


       int m = _subspace.size();

       tensorT ms(m);

       tensorT sm(m);

       for (int s=0; s<m; s++)

       {

           const vecfuncT& vs = _subspace[s].first;

           const vecfuncT& rs = _subspace[s].second;

           for (unsigned int i=0; i<vm.size(); i++)

           {

               ms[s] += vm[i].inner_local(rs[i]);

               sm[s] += vs[i].inner_local(rm[i]);

           }

       }

       _world.gop.sum(ms.ptr(),m);

       _world.gop.sum(sm.ptr(),m);


       tensorT newQ(m,m);

       if (m > 1) newQ(Slice(0,-2),Slice(0,-2)) = _Q;

       newQ(m-1,_) = ms;

       newQ(_,m-1) = sm;


       _Q = newQ;

       if (_world.rank() == 0) print(_Q);


       // Solve the subspace equations

       tensorT c;

       if (_world.rank() == 0) {

           double rcond = 1e-12;

           while (1) {

               c = KAIN(_Q,rcond);

               if (abs(c[m-1]) < 3.0) {

                   break;

               }

               else if (rcond < 0.01) {

                   if (_world.rank() == 0)

                     print("Increasing subspace singular value threshold ", c[m-1], rcond);

                   rcond *= 100;

               }

               else {

                   if (_world.rank() == 0)

                     print("Forcing full step due to subspace malfunction");

                   c = 0.0;

                   c[m-1] = 1.0;

                   break;

               }

           }

       }


       _world.gop.broadcast_serializable(c, 0);

       if (_world.rank() == 0) {

           //print("Subspace matrix");

           //print(Q);

           print("Subspace solution", c);

       }


       // Form linear combination for new solution

       vecfuncT phisa_new = zero_functions<valueT,NDIM>(_world, awfs_old.size());

       vecfuncT phisb_new = zero_functions<valueT,NDIM>(_world, bwfs_old.size());

       compress(_world, phisa_new, false);

       compress(_world, phisb_new, false);

       _world.gop.fence();

       std::complex<double> one = std::complex<double>(1.0,0.0);

       for (unsigned int m=0; m<_subspace.size(); m++) {

           const vecfuncT& vm = _subspace[m].first;

           const vecfuncT& rm = _subspace[m].second;

           const vecfuncT  vma(vm.begin(),vm.begin()+awfs_old.size());

           const vecfuncT  rma(rm.begin(),rm.begin()+awfs_old.size());

           const vecfuncT  vmb(vm.end()-bwfs_old.size(), vm.end());

           const vecfuncT  rmb(rm.end()-bwfs_old.size(), rm.end());


           gaxpy(_world, one, phisa_new, c(m), vma, false);

           gaxpy(_world, one, phisa_new,-c(m), rma, false);

           gaxpy(_world, one, phisb_new, c(m), vmb, false);

           gaxpy(_world, one, phisb_new,-c(m), rmb, false);

       }

       _world.gop.fence();


       if (_params.maxsub <= 1) {

           // Clear subspace if it is not being used

           _subspace.clear();

       }

       else if (_subspace.size() == _params.maxsub) {

           // Truncate subspace in preparation for next iteration

           _subspace.erase(_subspace.begin());

           _Q = _Q(Slice(1,-1),Slice(1,-1));

       }

       awfs_new = phisa_new;

       bwfs_new = phisb_new;

     }

     //*************************************************************************


     //*************************************************************************

     void reproject()

     {

       //  //if (_world.rank() == 0)

       //    //printf("\n\nreprojecting subspace to wavelet order: %d and thresh: %.5e\n\n",

       //    //FunctionDefaults<3>::get_k(), FunctionDefaults<3>::get_thresh());

       //

       //  unsigned int m = _subspace.size();

       //  for (unsigned int s = 0; s < m; s++)

       //  {

       //      vecfuncT& vs = _subspace[s].first;

       //      vecfuncT& rs = _subspace[s].second;

       //      reconstruct(_world, vs);

       //      reconstruct(_world, rs);

       //      unsigned int vm = vs.size();

       //      for (unsigned int i = 0; i < vm; i++)

       //      {

       //        vs[i] = madness::project(vs[i], FunctionDefaults<3>::get_k(),

       //          FunctionDefaults<3>::get_thresh(), false);

       //        rs[i] = madness::project(rs[i], FunctionDefaults<3>::get_k(),

       //          FunctionDefaults<3>::get_thresh(), false);

       //      }

       //      _world.gop.fence();

       //      truncate(_world, vs);

       //      truncate(_world, rs);

       //      normalize(_world, vs);

       //  }

       //  _world.gop.fence();


     }

     //*************************************************************************


   };


 //  template <typename T, int NDIM>

 //  struct lbcost {

 //      double leaf_value;

 //      double parent_value;

 //      lbcost(double leaf_value=1.0, double parent_value=0.0) : leaf_value(leaf_value), parent_value(parent_value) {}

 //      double operator()(const Key<NDIM>& key, const FunctionNode<T,NDIM>& node) const {

 //          if (key.level() <= 1) {

 //              return 100.0*(leaf_value+parent_value);

 //          }

 //          else if (node.is_leaf()) {

 //              return leaf_value;

 //          }

 //          else {

 //              return parent_value;

 //          }

 //      }

 //  };


   //***************************************************************************


   //***************************************************************************

   template <typename T, int NDIM>

   class Solver

   {

     // Typedef's

     typedef std::complex<T> valueT;

     typedef Function<T,NDIM> rfunctionT;

     typedef FunctionFactory<T,NDIM> rfactoryT;

     typedef Function<valueT,NDIM> functionT;

     typedef std::vector<functionT> vecfuncT;

     typedef FunctionFactory<valueT,NDIM> factoryT;

     typedef Vector<double,NDIM> kvecT;

     typedef SeparatedConvolution<T,3> operatorT;

     typedef std::shared_ptr<operatorT> poperatorT;

     typedef Tensor<double> rtensorT;

     typedef Tensor<std::complex<double> > ctensorT;

     typedef Tensor<valueT> tensorT;

     typedef std::pair<vecfuncT,vecfuncT> pairvecfuncT;

     typedef std::vector<pairvecfuncT> subspaceT;

     typedef std::vector<tensorT> vectensorT;

     typedef std::vector<subspaceT> vecsubspaceT;


     //*************************************************************************

     World& _world;

     //*************************************************************************


     //*************************************************************************

     // This variable could either be a nuclear potiential or a nuclear charge

     // density depending on the "ispotential" boolean variable in the

     // ElectronicStructureParams class.

     rfunctionT _vnucrhon;

     //*************************************************************************


     //*************************************************************************

     vecfuncT _phisa;

     //*************************************************************************


     //*************************************************************************

     vecfuncT _phisb;

     //*************************************************************************


     //*************************************************************************

     std::vector<T> _eigsa;

     //*************************************************************************


     //*************************************************************************

     std::vector<T> _eigsb;

     //*************************************************************************


     //*************************************************************************

     ElectronicStructureParams _params;

     //*************************************************************************


     //*************************************************************************

     std::vector<KPoint> _kpoints;

     //*************************************************************************


     //*************************************************************************

     std::vector<double> _occsa;

     //*************************************************************************


     //*************************************************************************

     std::vector<double> _occsb;

     //*************************************************************************


     //*************************************************************************

     rfunctionT _rhoa;

     //*************************************************************************


     //*************************************************************************

     rfunctionT _rhob;

     //*************************************************************************


     //*************************************************************************

     rfunctionT _rho;

     //*************************************************************************


     //*************************************************************************

     rfunctionT _vnuc;

     //*************************************************************************


     //*************************************************************************

     SeparatedConvolution<T,NDIM>* _cop;

     //*************************************************************************


 //    //*************************************************************************

 //    vecsubspaceT _subspace;

 //    //*************************************************************************

 //

 //    //*************************************************************************

 //    vectensorT _Q;

 //    //*************************************************************************


     //*************************************************************************

     Subspace<T,NDIM>* _subspace;

     //*************************************************************************


     //*************************************************************************

     MolecularEntity _mentity;

     //*************************************************************************


     //*************************************************************************

     double _residual;

     //*************************************************************************


     //*************************************************************************

     AtomicBasisSet _aobasis;

     //*************************************************************************


     //*************************************************************************

     double _maxthresh;

     //*************************************************************************


     //*************************************************************************

     std::ofstream _outputF;

     //*************************************************************************


     //*************************************************************************

     std::ofstream _matF;

     //*************************************************************************


     //*************************************************************************

     std::ofstream _eigF;

     //*************************************************************************


     //*************************************************************************

     std::ofstream _kmeshF;

     //*************************************************************************


     //*************************************************************************

     int _it;

     //*************************************************************************


     //*************************************************************************

     cvecfuncT _aobasisf;

     //*************************************************************************


     //*************************************************************************

     int _nao;

     //*************************************************************************


   public:


     //*************************************************************************

     double ttt, sss;

     void START_TIMER(World& world) {

         world.gop.fence(); ttt=wall_time(); sss=cpu_time();

     }


     void END_TIMER(World& world, const char* msg) {

     ttt=wall_time()-ttt; sss=cpu_time()-sss; if (world.rank()==0) printf("timer: %20.20s %8.2fs %8.2fs\n", msg, sss, ttt);

     }

     //*************************************************************************


     //*************************************************************************

     Solver(World& world, const std::string& filename) : _world(world)

     {

       init(filename);

       if (_params.periodic) FunctionDefaults<3>::set_bc(BC_PERIODIC);

       _residual = 1e5;

       make_nuclear_potential();


       if (_params.restart==0) initial_guess();

 //      for (unsigned int kp = 0; kp < _kpoints.size(); kp++)

 //      {

 //        _Q.push_back(tensorT(1,1));

 //        _subspace.push_back(subspaceT());

 //      }

       _subspace = new Subspace<T,NDIM>(world, _params);

     }

     //*************************************************************************


     //*************************************************************************

     void init(const std::string& filename)

     {


       // params

       if (_world.rank() == 0)

       {

         _params.read_file(filename);

         //_params.fractional = false;

       }

       // Send params

       _world.gop.broadcast_serializable(_params, 0);

       if (_params.centered)

         FunctionDefaults<3>::set_cubic_cell(-_params.L/2,_params.L/2);

       else

         FunctionDefaults<3>::set_cubic_cell(-_params.L/2,_params.L/2);

 //        FunctionDefaults<3>::set_cubic_cell(0,_params.L);

       FunctionDefaults<3>::set_thresh(_params.thresh);

       FunctionDefaults<3>::set_k(_params.waveorder);


       // mentity and aobasis

       if (_world.rank() == 0)

       {

         _aobasis.read_file(_params.basis);

         _mentity.read_file(filename, _params.fractional);

         if (_params.centered) _mentity.center();

       }

       // Send mentity and aobasis

       _world.gop.broadcast_serializable(_mentity, 0);

       _world.gop.broadcast_serializable(_aobasis, 0);

       // set number of electrons to the total nuclear charge of the mentity

       _params.nelec = _mentity.total_nuclear_charge();

       // total number of bands include empty

       _params.nbands = (_params.nelec/2) + _params.nempty;

       _params.ncharge = _mentity.total_nuclear_charge();

       if ((_params.nelec % 2) == 1) _params.nelec++;


       // Open output files

       _outputF.open("output.txt");

       _matF.open("matrix.txt");

       _eigF.open("eigs.txt");


       // kmesh

       if (_params.restart == 0)

       {

         if (_params.periodic) // PERIODIC

         {

           // GAMMA POINT

           if ((_params.ngridk0 == 1) && (_params.ngridk1 == 1) && (_params.ngridk2 == 1))

           {

             _kpoints.push_back(KPoint(coordT(0.0), 1.0));

           }

           if ((_params.ngridk0 == 0) && (_params.ngridk1 == 0) && (_params.ngridk2 == 0))

           {

             double TWO_PI = 2.0 * madness::constants::pi;

             double t1 = TWO_PI/_params.L;

             coordT c1 = vec(0.0,0.0,0.0);

             coordT c2 = vec(0.5*t1,0.5*t1,0.5*t1);

             _kpoints.push_back(KPoint(c1, 0.5));

             _kpoints.push_back(KPoint(c2, 0.5));

           }

           else // NORMAL BANDSTRUCTURE

           {

             _kpoints = genkmesh(_params.ngridk0, _params.ngridk1,

                                 _params.ngridk2, _params.koffset0,

                                 _params.koffset1, _params.koffset2,

                                 _params.L);

           }

         }

         else // NOT-PERIODIC

         {

           _kpoints.push_back(KPoint(coordT(0.0), 1.0));

         }

         if (_world.rank() == 0)

         {

           _kmeshF.open("kpoints.txt");

           _kmeshF << "kpts: " << _kpoints.size() << endl;

           _kmeshF << "ik" << setw(10) << "kpt" << setw(30) << "weight" << endl;

           _kmeshF << "--" << setw(10) << "---" << setw(30) << "------" << endl;


           //_kmeshF << setfill('-') << setw(55) << "-" << endl;

           //_kmeshF << setfill(' ') << endl;

           _kmeshF << endl;

           for (unsigned int i = 0; i < _kpoints.size(); i++)

           {

             KPoint kpoint = _kpoints[i];

             _kmeshF << i << setw(10) << kpoint.k[0];

             _kmeshF << setw(10) << kpoint.k[1];

             _kmeshF << setw(10) << kpoint.k[2];

             _kmeshF << setw(10) << kpoint.weight << endl;

           }

           _kmeshF.close();

         }

       }

       else

       {

         load_orbitals();

       }

     }

     //*************************************************************************


     //*************************************************************************

     std::vector<KPoint> genkmesh(unsigned int ngridk0, unsigned ngridk1, unsigned int ngridk2,

                                  double koffset0, double koffset1, double koffset2, double R)

     {

       std::vector<KPoint> kmesh;

       double step0 = 1.0/ngridk0;

       double step1 = 1.0/ngridk1;

       double step2 = 1.0/ngridk2;

       double weight = 1.0/(ngridk0*ngridk1*ngridk2);

       double TWO_PI = 2.0 * madness::constants::pi;

       for (unsigned int i = 0; i < ngridk0; i++)

       {

         for (unsigned int j = 0; j < ngridk1; j++)

         {

           for (unsigned int k = 0; k < ngridk2; k++)

           {

             //double k0 = (i*step0 - step0/2) * TWO_PI/R;

             //double k1 = (j*step1 - step1/2) * TWO_PI/R;

             //double k2 = (k*step2 - step2/2) * TWO_PI/R;

             double k0 = ((i*step0)+koffset0) * TWO_PI/R;

             double k1 = ((j*step1)+koffset1) * TWO_PI/R;

             double k2 = ((k*step2)+koffset2) * TWO_PI/R;

             KPoint kpoint(k0, k1, k2, weight);

             kmesh.push_back(kpoint);

           }

         }

       }

       return kmesh;

     }

     //*************************************************************************


     //*************************************************************************

     void save_orbitals()

     {

       archive::ParallelOutputArchive ar(_world, "orbitals", _params.nio);

       ar & _params.spinpol;

       ar & (unsigned int)(_kpoints.size());

       for (unsigned int i = 0; i < _kpoints.size(); i++) ar & _kpoints[i];

 //      ar & (unsigned int)(_occsa.size());

 //      for (unsigned int i = 0; i < _occsa.size(); i++) ar & _occsa[i];

       ar & (unsigned int)(_phisa.size());

       for (unsigned int i = 0; i < _phisa.size(); i++) ar & _phisa[i];

       if (_params.spinpol)

       {

 //        ar & (unsigned int)(_occsb.size());

 //        for (unsigned int i = 0; i < _occsb.size(); i++) ar & _occsb[i];

         ar & (unsigned int)(_phisb.size());

         for (unsigned int i = 0; i < _phisb.size(); i++) ar & _phisb[i];

       }

     }

     //*************************************************************************


     //*************************************************************************

     void load_orbitals()

     {

       const double thresh = FunctionDefaults<3>::get_thresh();

       const int k = FunctionDefaults<3>::get_k();


       archive::ParallelInputArchive ar(_world, "orbitals");


       // spin-polarized

       bool spinrest;

       ar & spinrest;

       // kpoints

       unsigned int nkpts;

       ar & nkpts;

       _kpoints.clear();

       for (unsigned int i = 0; i < nkpts; i++)

       {

         KPoint tkpt;

         ar & tkpt;

         _kpoints.push_back(tkpt);

       }

       // occs

 //      unsigned int noccs;

 //      ar & noccs;

 //      _occs.clear();

 //      for (unsigned int i = 0; i < noccs; i++)

 //      {

 //        double tocc;

 //        ar & tocc;

 //        _occs.push_back(tocc);

 //      }

       // orbitals

       unsigned int norbs;

       ar & norbs;

       _phisa.clear();

       _eigsa.clear();

       for (unsigned int i = 0; i < norbs; i++)

       {

         functionT tfunc;

         ar & tfunc;

         _phisa.push_back(tfunc);

         _eigsa.push_back(-0.1);

       }

       // check for k mismatch

       if (_phisa[0].k() != k)

       {

         reconstruct(_world,_phisa);

         for (unsigned int i = 0; i < _phisa.size(); i++)

           _phisa[i] = madness::project(_phisa[i], k, thresh, false);

         _world.gop.fence();

       }

       // orthonormalize

       for (unsigned int i = 0; i < _kpoints.size(); i++)

         gram_schmidt(_phisa, _kpoints[i]);


       if (_params.spinpol)

       {

         _phisb.clear();

         _eigsb.clear();

         for (unsigned int i = 0; i < norbs; i++)

         {

           functionT tfunc;

           ar & tfunc;

           _phisb.push_back(tfunc);

           _eigsb.push_back(-0.1);

         }

         // check for k mismatch

         if (_phisb[0].k() != k)

         {

           reconstruct(_world,_phisb);

           for (unsigned int i = 0; i < _phisb.size(); i++)

             _phisb[i] = madness::project(_phisb[i], k, thresh, false);

           _world.gop.fence();

         }

         // orthonormalize

         for (unsigned int i = 0; i < _kpoints.size(); i++)

           gram_schmidt(_phisb, _kpoints[i]);

       }

       else

       {

         for (unsigned int i = 0; i < norbs; i++)

         {

           _phisb.push_back(_phisa[i]);

           _eigsb.push_back(_eigsa[i]);

         }

       }

       // create vector for occupation numbers

       _occsa = std::vector<double>(norbs, 0.0);

       _occsb = std::vector<double>(norbs, 0.0);

     }

     //*************************************************************************


     //*************************************************************************

     void make_nuclear_potential_impl()

     {

       _vnucrhon = rfactoryT(_world).functor(rfunctorT(new MolecularPotentialFunctor(_mentity))).thresh(_params.thresh * 0.1).truncate_on_project();

       _vnuc = copy(_vnucrhon);

     }

     //*************************************************************************


     //*************************************************************************

     void make_nuclear_charge_density_impl()

     {

       std::vector<coordT> specialpts;

       for (int i = 0; i < _mentity.natom(); i++)

       {

         coordT pt(0.0);

         Atom atom = _mentity.get_atom(i);

         pt[0] = atom.x; pt[1] = atom.y; pt[2] = atom.z;

         specialpts.push_back(pt);

         if (_world.rank() == 0) print("Special point: ", pt);

       }

       double now = wall_time();

       std::cout << "THE FUNCTOR IS " << MolecularNuclearChargeDensityFunctor(_mentity, _params.L, _params.periodic, specialpts)(specialpts[0]) << endl;

       // WSTHORNTON

       //MADNESS_ASSERT(false);


       _vnucrhon = rfactoryT(_world).functor(

           rfunctorT(new MolecularNuclearChargeDensityFunctor(_mentity, _params.L, _params.periodic, specialpts))).

           thresh(_params.thresh).initial_level(6).truncate_on_project();


       if (_world.rank() == 0) printf("%f\n", wall_time() - now);

       if (_world.rank() == 0) print("calculating trace of rhon ..\n\n");

       double rtrace = _vnucrhon.trace();

       if (_world.rank() == 0) print("rhon trace = ", rtrace);

       now = wall_time();

       _vnucrhon.truncate();

       _vnuc = apply(*_cop, _vnucrhon);

       if (_world.rank() == 0) printf("%f\n", wall_time() - now);

       if (_world.rank() == 0) print("Done creating nuclear potential ..\n");


       // WSTHORNTON

       rfunctionT vnuc2 = rfactoryT(_world).functor(rfunctorT(new

           MolecularPotentialFunctor(_mentity))).

           thresh(_params.thresh * 0.1).truncate_on_project();

       rfunctionT vnucdiff = _vnuc-vnuc2;

       double t1 = vnucdiff.trace();

       if (_world.rank() == 0) printf("Difference in nuclear potential: %15.8f\n\n", t1);

       for (int i = 0; i < 101; i++)

       {

         double dx = _params.L/100;

         double pt2 = -_params.L/2 + dx*i;

         coordT cpt(pt2);

         double val = vnucdiff(cpt);

         if (_world.rank() == 0) printf("%10.5f    %15.8f\n",pt2,val);

       }

       //MADNESS_ASSERT(false);

     }

     //*************************************************************************


     //*************************************************************************

     void make_nuclear_potential()

     {

       // Make coulomb operator

       _cop = CoulombOperatorPtr(_world, _params.lo, FunctionDefaults<3>::get_thresh() * 0.1);


       Tensor<double> csize = FunctionDefaults<3>::get_cell();

       if (_world.rank() == 0)

       {

         printf("Cell parameters\n");

         printf("------------------------------\n");

         print("cell(x) is ",csize(0,0), csize(0,1));

         print("cell(y) is ",csize(1,0), csize(1,1));

         print("cell(z) is ",csize(2,0), csize(2,1));

         printf("\n");

       }

       if (_params.ispotential) // potential

       {

         make_nuclear_potential_impl();

       }

       else // charge density

       {

         make_nuclear_charge_density_impl();

       }

     }

     //*************************************************************************


     //*************************************************************************

     struct GuessDensity : public FunctionFunctorInterface<double,3> {

         const MolecularEntity& mentity;

         const AtomicBasisSet& aobasis;

         double R;

         const bool periodic;


         double operator()(const coordT& x) const

         {

           double value = 0.0;

           if (periodic)

           {

             for (int xr = -2; xr <= 2; xr += 1)

             {

               for (int yr = -2; yr <= 2; yr += 1)

               {

                 for (int zr = -2; zr <= 2; zr += 1)

                 {

                   value += aobasis.eval_guess_density(mentity,

                       x[0]+xr*R, x[1]+yr*R, x[2]+zr*R);

                 }

               }

             }

           }

           else

           {

             value = aobasis.eval_guess_density(mentity, x[0], x[1], x[2]);

           }

           return value;

         }


         GuessDensity(const MolecularEntity& mentity, const AtomicBasisSet& aobasis,

             const double& R, const bool& periodic)

         : mentity(mentity), aobasis(aobasis), R(R), periodic(periodic) {}

     };

     //*************************************************************************


     //*************************************************************************

     template <typename Q>

     void test_periodicity(const Function<Q,3>& f)

     {

       int npts = 101;

       double eps = 1e-8;

       coordT r(0.0);

       double delta = _params.L/(npts-1);

       double begin = -_params.L/2;

       double end = _params.L/2;

       double tol = 1e-6;

       // x-axis

       printf("periodicity along x-axis:  \n");

       printf("-------------------------------------------------------------\n\n");

       for (int i = 0; i < npts; i++)

       {

         printf("\n-------------------- edge --------------------\n");

         for (int j = 0; j < npts; j++)

         {

           coordT r1, r2, dr1, dr2;

           r1[0] = begin+eps; r1[1] = (i*delta)+begin; r1[2] = (j*delta)+begin;

           r2[0] = end-eps; r2[1] = (i*delta)+begin; r2[2] = (j*delta)+begin;

           dr1[0] = begin+2*eps; dr1[1] = (i*delta)+begin; dr1[2] = (j*delta)+begin;

           dr2[0] = end-2*eps; dr2[1] = (i*delta)+begin; dr2[2] = (j*delta)+begin;

           double val = std::abs(f(r1)-f(r2));

           std::string success = val < tol ? "PASS!" : "FAIL!";

           printf("%10.6f%10.6f%10.6f  %10.6f%10.6f%10.6f  %10.5e   %s\n",

               r1[0],r1[1],r1[2],r2[0],r2[1],r2[2],val,success.c_str());

         }

       }

       // y-axis

       printf("\nperiodicity along y-axis:  \n");

       printf("-------------------------------------------------------------\n\n");

       for (int i = 0; i < npts; i++)

       {

         printf("\n-------------------- edge --------------------\n");

         for (int j = 0; j < npts; j++)

         {

           coordT r1, r2, dr1, dr2;

           r1[0] = (i*delta)+begin; r1[1] = begin+eps; r1[2] = (j*delta)+begin;

           r2[0] = (i*delta)+begin; r2[1] = end-eps; r2[2] = (j*delta)+begin;

           dr1[0] = (i*delta)+begin; dr1[1] = begin+2*eps; dr1[2] = (j*delta)+begin;

           dr2[0] = (i*delta)+begin; dr2[1] = end-2*eps; dr2[2] = (j*delta)+begin;

           double val = std::abs(f(r1)-f(r2));

           std::string success = val < tol ? "PASS!" : "FAIL!";

           printf("%10.6f%10.6f%10.6f  %10.6f%10.6f%10.6f  %10.5e   %s\n",

               r1[0],r1[1],r1[2],r2[0],r2[1],r2[2],val,success.c_str());

         }

       }

       // z-axis

       printf("\nperiodicity along z-axis:  \n");

       printf("-------------------------------------------------------------\n\n");

       for (int i = 0; i < npts; i++)

       {

         printf("\n-------------------- edge --------------------\n");

         for (int j = 0; j < npts; j++)

         {

           coordT r1, r2, dr1, dr2;

           r1[0] = (i*delta)+begin; r1[1] = (j*delta)+begin; r1[2] = begin+eps;

           r2[0] = (i*delta)+begin; r2[1] = (j*delta)+begin; r2[2] = end-eps;

           dr1[0] = (i*delta)+begin; dr1[1] = (j*delta)+begin; dr1[2] = begin+2*eps;

           dr2[0] = (i*delta)+begin; dr2[1] = (j*delta)+begin; dr2[2] = end-2*eps;

           double val = std::abs(f(r1)-f(r2));

           std::string success = val < tol ? "PASS!" : "FAIL!";

           printf("%10.6f%10.6f%10.6f  %10.6f%10.6f%10.6f  %10.5e   %s\n",

               r1[0],r1[1],r1[2],r2[0],r2[1],r2[2],val,success.c_str());

         }

       }

     }

     //*************************************************************************


     //*************************************************************************

     rfunctionT

     make_lda_potential(World& world,

                        const rfunctionT& arho,

                        const rfunctionT& brho,

                        const rfunctionT& adelrhosq,

                        const rfunctionT& bdelrhosq)

     {

   //      MADNESS_ASSERT(!_params.spinpol);

         rfunctionT vlda = copy(arho);

 //        vlda.unaryop(&::libxc_ldaop<double>);

         vlda.unaryop(&::ldaop<double>);

         return vlda;

     }


     vecfuncT project_ao_basis(World& world, KPoint kpt) {

         vecfuncT ao(_aobasis.nbf(_mentity));


 //        Level initial_level = 3;

 //        for (int i=0; i < _aobasis.nbf(_mentity); i++) {

 //          functorT aofunc(new AtomicBasisFunctor(_aobasis.get_atomic_basis_function(_mentity,i),

 //              _params.L, _params.periodic, kpt));

 //            ao[i] = factoryT(world).functor(aofunc).initial_level(initial_level).truncate_on_project().nofence();

 //        }

 //        world.gop.fence();


 //        WSTAtomicBasisFunctor aofunc(_aobasis.get_atomic_basis_function(_mentity,4),

 //            _params.L, kpt.k[0], kpt.k[1], kpt.k[2]);

 //        coord_3d p(5e-2);

 //        double_complex val = aofunc(p);

 //        print("AO_PROJECT: val is ", val);

 //        MADNESS_ASSERT(false);


         for (int i=0; i < _aobasis.nbf(_mentity); i++) {

           functorT aofunc(new WSTAtomicBasisFunctor(_aobasis.get_atomic_basis_function(_mentity,i),

               _params.L, kpt.k[0], kpt.k[1], kpt.k[2]));

             ao[i] = factoryT(world).functor(aofunc).truncate_on_project().truncate_mode(0);

         }

         world.gop.fence();


 //        std::vector<double> norms;

 //        norms = norm2s(world, ao);

 //        for (int i=0; i<_aobasis.nbf(_mentity); i++) {

 //            if (world.rank() == 0 && fabs(norms[i]-1.0)>1e-3) print(i," bad ao norm?", norms[i]);

 //            norms[i] = 1.0/norms[i];

 //        }

 //

 //        scale(world, ao, norms);

 //        norms = norm2s(world, ao);

 //        for (int i=0; i<_aobasis.nbf(_mentity); i++) {

 //            if (world.rank() == 0 && fabs(norms[i]-1.0)>1e-3) print(i," bad ao norm?", norms[i]);

 //            norms[i] = 1.0/norms[i];

 //        }

 //        scale(world, ao, norms);


         return ao;

     }

     //*************************************************************************


     //*************************************************************************

     // Constructor

     Solver(World& world,

            rfunctionT vnucrhon,

            vecfuncT phisa,

            vecfuncT phisb,

            std::vector<T> eigsa,

            std::vector<T> eigsb,

            ElectronicStructureParams params,

            MolecularEntity mentity)

        : _world(world), _vnucrhon(vnucrhon), _phisa(phisa), _phisb(phisb),

        _eigsa(eigsa), _eigsb(eigsb), _params(params), _mentity(mentity)

     {

       _residual = 1e5;

       _cop = CoulombOperatorPtr(const_cast<World&>(world), params.lo, params.thresh * 0.1);


       if (params.ispotential)

       {

         _vnuc = copy(_vnucrhon);

       }

       else

       {

         _vnuc = apply(*_cop, _vnucrhon);

       }

     }

     //*************************************************************************


     //*************************************************************************

     void initial_guess()

     {

       // Get initial guess for the electronic density

       if (_world.rank() == 0) print("Guessing rho ...\n\n");


       rfunctionT rho = rfactoryT(_world);

       if (_params.restart == 0)

       {

         rho = rfactoryT(_world).functor(rfunctorT(new GuessDensity(_mentity,

               _aobasis, _params.L, _params.periodic))).initial_level(3);

       }

       else

       {

         MADNESS_EXCEPTION("restart not working right now!",0);

       }

       // This is a cheat

       rho.scale(_params.ncharge/rho.trace());


       char fname3[25];

       coord_3d rp1(-_params.L/2);

       coord_3d rp2(_params.L/2);

       plot_line(fname3,101,rp1,rp2,rho);


       // load balance

       //if(_world.size() > 1) {

       //    START_TIMER(_world);

       //    LoadBalanceDeux<3> lb(_world);

       //    lb.add_tree(_vnuc, lbcost<double,3>(1.0, 0.0), false);

       //    lb.add_tree(rho, lbcost<double,3>(1.0, 1.0), true);


       //    FunctionDefaults<3>::redistribute(_world, lb.load_balance(6.0));

       //}


       if (_params.restart != 1)

       {

         // build effective potential

         rfunctionT vlocal;

         // Is this a many-body system?

         if (_params.ncharge > 1.0)

         {

           if (_world.rank() == 0) print("Creating Coulomb op ...\n\n");

           SeparatedConvolution<double, 3>* op = 0;

           // Is this system periodic?

           if (_params.periodic)

           {

             Tensor<double> cellsize = FunctionDefaults<3>::get_cell_width();

             //op = PeriodicCoulombOpPtr<double, 3> (_world, _params.waveorder,

             //    _params.lo, _params.thresh * 0.1, cellsize);

             op = CoulombOperatorPtr(_world, _params.lo, _params.thresh * 0.1);

           }

           else

           {

             op = CoulombOperatorPtr(_world, _params.lo, _params.thresh * 0.1);

           }

           if (_world.rank() == 0) print("Building effective potential ...\n\n");

           rfunctionT vc = apply(*op, rho);

           vlocal = _vnuc + vc; //.scale(1.0-1.0/nel); // Reduce coulomb to increase binding

           rho.scale(0.5);

           // WSTHORNTON

           _rhoa = rho;

           _rhob = rho;

           // Do the LDA

           rfunctionT vlda = make_lda_potential(_world, rho, rho, rfunctionT(), rfunctionT());

           vlocal = vlocal + vlda;

           delete op;

         }

         else

         {

           vlocal = _vnuc;

         }


         // Clear these functions

 //        rho.clear();

         vlocal.reconstruct();


         // Get size information from k-points and ao_basis so that we can correctly size

         // the _orbitals data structure and the eigs tensor

         // number of orbitals in the basis set

         int _nao = _aobasis.nbf(_mentity);


         // number of kpoints

         int nkpts = _kpoints.size();

         // total number of orbitals to be processed (no symmetry)

         int norbs = _params.nbands * nkpts;

         // Check to see if the basis set can accomodate the number of bands

         if (_params.nbands > _nao)

           MADNESS_EXCEPTION("Error: basis not large enough to accomodate number of bands", _nao);

         // set the number of orbitals

         _eigsa = std::vector<double>(norbs, 0.0);

         _eigsb = std::vector<double>(norbs, 0.0);

         _occsa = std::vector<double>(norbs, 0.0);

         _occsb = std::vector<double>(norbs, 0.0);

         if (_world.rank() == 0) print("Building kinetic energy matrix ...\n\n");

         // Need to do kinetic piece for every k-point

         for (int ki = 0; ki < nkpts; ki++)

         {

           // These are our initial basis functions

           if (_world.rank() == 0) print("Projecting atomic orbitals ...\n\n");

           START_TIMER(_world);

           cvecfuncT ao = project_ao_basis(_world, _kpoints[ki]);

           END_TIMER(_world, "projecting atomic orbital basis");

 //          for (unsigned int iao = 0; iao < _nao; iao)

 //          {

 //            _aobasisf.push_back(ao[iao]);

 //          }


           for (unsigned int ai = 0; ai < ao.size(); ai++)

           {

             std::vector<long> npt(3,101);

             char fnamedx[50];

             sprintf(fnamedx, "aofunc_k_%2.2d__%2.2d__.dx",ki,ai);

             std::vector<long> npt2(3,101);

             plotdx(ao[ai], fnamedx, FunctionDefaults<3>::get_cell(), npt2);

           }


           coord_3d p1(-_params.L/2);

           coord_3d p2(_params.L/2);

           for (int i = 0; i < ao.size(); i++)

           {

             char fname[25];

             sprintf(fname, "ao_line_%d.txt",i);

             plot_line(fname,101,p1,p2,ao[i]);

           }

           char fname2[25];

           sprintf(fname2, "vnuc_line.txt");

           plot_line(fname2,101,p1,p2,_vnuc);

           char fname3[25];

           sprintf(fname3, "vlocal_line.txt");

           plot_line(fname3,101,p1,p2,vlocal);


           // load balancing

           //if(_world.size() > 1)

           //{

           //  LoadBalanceDeux<3> lb(_world);

           //  lb.add_tree(_vnuc, lbcost<double,3>(1.0, 1.0), false);

           //  for(unsigned int i = 0; i < ao.size(); i++)

           //  {

           //      lb.add_tree(ao[i], lbcost<valueT,3>(1.0, 1.0), false);

           //  }


           //  FunctionDefaults<3>::redistribute(_world, lb.load_balance(6.0));

           //}


           // Get k-point from list

           KPoint& kpoint = _kpoints[ki];


           // WSTHORNTON

 //          ctensorT S = matrix_inner(_world,ao,ao,true);

 //          print(S);

 //          ctensorT U = csqrt(S);

 //          ao = transform(_world, ao, U, _params.thresh, true);


           // Build kinetic matrx

           //ctensorT kinetic = ::kinetic_energy_matrix_slow<T,NDIM>(_world, ao, _params.periodic, kpt);

           ctensorT kinetic = ::kinetic_energy_matrix_slow<T,NDIM>(_world, ao, _params.periodic, kpoint);

           // Build the overlap matrix

           if (_world.rank() == 0) print("Building overlap matrix ...\n\n");

           ctensorT overlap = matrix_inner(_world, ao, ao, true);

           // Build the potential matrix

           reconstruct(_world, ao);

           if (_world.rank() == 0) print("Building potential energy matrix ...\n\n");

           //cvecfuncT vpsi = mul_sparse(_world, vlocal, ao, _params.thresh);

           cvecfuncT vpsi;

           for (int i = 0; i < ao.size(); i++)

             vpsi.push_back(vlocal*ao[i]);

           _world.gop.fence();

           compress(_world, vpsi);

           truncate(_world, vpsi);

           compress(_world, ao);

           // Build the potential matrix

           ctensorT potential = matrix_inner(_world, vpsi, ao, true);

           _world.gop.fence();

           // free memory

           vpsi.clear();

           _world.gop.fence();


           // Construct and diagonlize Fock matrix

           ctensorT fock = potential + kinetic;

           ctensorT fockzero = fock-conj_transpose(fock);

           if (_world.rank() == 0)

           {

             print("Kinetic:");

             print(kinetic);

             print("Potential:");

             print(potential);

             print("Fock: (pre-symmetrized)");

             print(fock);

             print("FockZero: (should be zero)");

             print(fockzero);

             print("Overlap:");

             print(overlap);

           }

           fock = 0.5 * (fock + conj_transpose(fock));

           for (unsigned int i = 0; i < fock.dim(0); i++)

           {

             fock(i,i) += i*_params.thresh*0.1;

           }


           ctensorT c; rtensorT e;

           sygv(fock, overlap, 1, c, e);


           // diagonlize kinetic

           ctensorT ck; rtensorT ek;

           sygv(kinetic, overlap, 1, ck, ek);

           // diagonalize potential

           ctensorT cp; rtensorT ep;

           sygv(potential, overlap, 1, cp, ep);

           // diagonalize overlap

           ctensorT co; rtensorT eo;

           syev(overlap, co, eo);


           if (_world.rank() == 0)

           {

             print("fock eigenvectors dims:",c.dim(0),c.dim(1));

             print("fock eigenvectors:");

             print(c);

           }


           if (_world.rank() == 0)

           {

             print("kinetic eigenvalues");

             print(ek);

           }


           if (_world.rank() == 0)

           {

             print("potential eigenvalues");

             print(ep);

           }


           if (_world.rank() == 0)

           {

             print("overlap eigenvalues");

             print(eo);

           }

           if (_world.rank() == 0)

           {

             print("fock eigenvalues");

             print(e);

           }


           if (_world.rank() == 0)

           {

             printf("Overlap: \n");

             for (int i = 0; i < overlap.dim(0); i++)

                 {

                     for (int j = 0; j < overlap.dim(1); j++)

                         {

                             printf("%10.5f", real(overlap(i,j)));

                         }

                     printf("\n");

                 }

             printf("\n");

             printf("\n");

           }


           compress(_world, ao);

           _world.gop.fence();

           // Take linear combinations of the gaussian basis orbitals as the starting

           // orbitals for solver

           vecfuncT tmp_orbitals = transform(_world, ao, c(_, Slice(0, _nao - 1)));


 //          tmp_orbitals[0] = ao[0];

 //          tmp_orbitals[1] = ao[1];

 //          tmp_orbitals[2] = ao[2];

 //          tmp_orbitals[3] = ao[3];

 //          tmp_orbitals[4] = ao[4];


           // WSTHORNTON

           // checking the symmetry

 //          int npts = 101;

 //          double delta = _params.L/(npts-1);

 //          double begin = -_params.L/2;

 //          double end = _params.L/2;

 //          double tol = 1e-6;

 //

 //          for (int i = 0; i < npts; i++)

 //          {

 //            double x = (i*delta)+begin;

 //            for (int j = 0; j < npts; j++)

 //            {

 //              double y = (j*delta)+begin;

 //              for (int k = 0; k < npts; k++)

 //              {

 //                double z = (k*delta)+begin;

 //                coord_3d r1 = vec(x,y,z);

 //                coord_3d r2 = vec(y,x,z);

 //                coord_3d r3 = vec(z,y,x);

 //                coord_3d r4 = vec(x,z,y);

 //                double_complex pxr2 = ao[2](r2); double_complex pyr1 = ao[3](r1);

 //                double_complex pxr3 = ao[2](r3); double_complex pzr1 = ao[4](r1);

 //                double_complex pyr4 = ao[3](r4);

 //                double err_xy = std::abs(pxr2-pyr1);

 //                double err_xz = std::abs(pxr3-pzr1);

 //                std::string success = err_xy < tol ? "PASS!" : "FAIL!";

 //                printf("%10.4e + %10.4e     %10.4e + %10.4e     %15.8e\n     %s\n",

 //                    std::real(pxr2), std::imag(pxr2), std::real(pyr1), std::imag(pyr1),

 //                    err_xy, success.c_str());

 //              }

 //            }

 //          }


 //          MADNESS_ASSERT(false);


           // WSTHORNTON

 //          const double PI_OVER_8 = madness::constants::pi/8;

 //          SeparatedConvolution<double,3> op = CoulombOperator(_world, _params.lo, _params.thresh * 0.1);

 //          rfunctionT vlda = make_lda_potential(_world, rho, rho, rfunctionT(), rfunctionT());

 //          rho.scale(2.0);

 //          rfunctionT vc2 = apply(op,rho);

 //          double rtr2 = rho.trace();

 //          rfunctionT vlocal2 = vc2 + _vnuc;

 //

 //          SeparatedConvolution<double,3> op2 = CoulombOperator(_world, _params.lo, _params.thresh * 0.1);

 //          SeparatedConvolution<double,3> bshop = BSHOperator3D(_world, -0.2, _params.lo, _params.thresh * 0.1);


 //          if (_world.rank() == 0)

 //          {

 //            print("trace of rho:");

 //            print(rtr2);

 //          }

 //          for (int i = 0; i < 5; i++)

 //          {

 //            double th = i*PI_OVER_8;

 //            tmp_orbitals[2] = ao[2];

 //            tmp_orbitals[3] = cos(th)*ao[3] + sin(th)*ao[4];

 //            tmp_orbitals[4] = -sin(th)*ao[3] + cos(th)*ao[4];

 //

 //            ctensorT fred(3,3);

 //            for (int ii = 2; ii < 5; ii++)

 //            {

 //              for (int jj = 2; jj < 5; jj++)

 //              {

 //                fred(ii-2,jj-2) = inner(tmp_orbitals[ii], _vnuc*tmp_orbitals[jj]);

 //                if (std::abs(fred(ii-2,jj-2)) < 1e-6)

 //                  fred(ii-2,jj-2) = std::complex<double>(0.0,0.0);

 //

 //              }

 //            }


 //            complex_derivative_3d Dx(_world,0);

 //            complex_derivative_3d Dy(_world,1);

 //            complex_derivative_3d Dz(_world,2);

 //

 //            ctensorT fred(3,3);

 //            std::complex<double> I = std::complex<double>(0.0,1.0);

 //            std::complex<double> one = std::complex<double>(1.0,0.0);

 //            for (int ii = 2; ii < 5; ii++)

 //            {

 //              for (int jj = 2; jj < 5; jj++)

 //              {

 //                double ksq = kpoint.k[0]*kpoint.k[0] +

 //                    kpoint.k[1]*kpoint.k[1] +

 //                    kpoint.k[2]*kpoint.k[2];

 //

 //                cfunctionT ct1 = -I*kpoint.k[0]*Dx(tmp_orbitals[jj]) -

 //                  I*kpoint.k[1]*Dy(tmp_orbitals[jj]) -

 //                  I*kpoint.k[2]*Dz(tmp_orbitals[jj]);

 //

 //                cfunctionT ct2 = -0.5*Dx(Dx(tmp_orbitals[jj])) +

 //                    Dy(Dy(tmp_orbitals[jj])) +

 //                    Dz(Dz(tmp_orbitals[jj]));

 //

 //                cfunctionT ct3 = 0.5*ksq*tmp_orbitals[jj];

 //

 //                fred(ii-2,jj-2) = inner(tmp_orbitals[ii], ct1+ct2+ct3);

 //                if (std::abs(fred(ii-2,jj-2)) < 1e-6)

 //                  fred(ii-2,jj-2) = std::complex<double>(0.0,0.0);

 //              }

 //            }


 //            ctensorT cf; rtensorT ef;

 //            syev(fred, cf, ef);

 //

 //            if (_world.rank() == 0)

 //            {

 //                print("Fred:", i);

 //                print(fred);

 //                print("eigenvalues:");

 //                print(ef);

 //                print("eigenvectors:");

 //                print(cf);

 //            }

 //          }

 //          MADNESS_ASSERT(false);


           _world.gop.fence();

           truncate(_world, tmp_orbitals);

           normalize(_world, tmp_orbitals);


           // Build the overlap matrix

           if (_world.rank() == 0) print("Building overlap matrix ...\n\n");

           ctensorT overlap2 = matrix_inner(_world, tmp_orbitals, tmp_orbitals, true);


           rtensorT tmp_eigs = e(Slice(0, _nao - 1));


           if (_world.rank() == 0) printf("(%8.4f,%8.4f,%8.4f)\n",kpoint.k[0], kpoint.k[1], kpoint.k[2]);

           if (_world.rank() == 0) print(tmp_eigs);

           if (_world.rank() == 0) print("\n");


           //if (_world.rank() == 0) print("kinetic energy for kp = ", kp);

           //if (_world.rank() == 0) print(kinetic);

           //if (_world.rank() == 0) print("\n");


           // DEBUG

           if (_world.rank() == 0) {

               printf("Overlap: \n");

               for (int i = 0; i < kinetic.dim(0); i++)

                   {

                       for (int j = 0; j < kinetic.dim(1); j++)

                           {

                               printf("%10.5f", real(overlap(i,j)));

                           }

                       printf("\n");

                   }

               printf("\n");

               printf("\n");


               printf("Kinetic: \n");

               for (int i = 0; i < kinetic.dim(0); i++)

                   {

                       for (int j = 0; j < kinetic.dim(1); j++)

                           {

                               printf("%10.5f", real(kinetic(i,j)));

                           }

                       printf("\n");

                   }

               printf("\n");

               printf("\n");


               printf("V: \n");

               for (int i = 0; i < potential.dim(0); i++)

                   {

                       for (int j = 0; j < potential.dim(1); j++)

                           {

                               printf("%10.5f", real(potential(i,j)));

                           }

                       printf("\n");

                   }

               printf("\n");

               printf("\n");


               printf("Fock: \n");

               for (int i = 0; i < fock.dim(0); i++)

                   {

                       for (int j = 0; j < fock.dim(1); j++)

                           {

                               printf("%10.5f", real(fock(i,j)));

                           }

                       printf("\n");

                   }

               printf("\n");

               printf("\n");


               printf("New overlap: \n");

               for (int i = 0; i < overlap2.dim(0); i++)

                   {

                       for (int j = 0; j < overlap2.dim(1); j++)

                           {

                               printf("%10.5f", real(overlap2(i,j)));

                           }

                       printf("\n");

                   }

               printf("\n");

               printf("\n");

           }


           // Fill in orbitals and eigenvalues

           kpoint.begin = ki*_params.nbands;

           kpoint.end = (ki+1)*_params.nbands;

           for (unsigned int oi = kpoint.begin, ti = 0; oi < kpoint.end; oi++, ti++)

           {

             //if (_world.rank() == 0) print(oi, ti, kpt.begin, kpt.end);

             // normalize the orbitals

             //tmp_orbitals[ti].scale(1.0/tmp_orbitals[ti].norm2());

             _phisa.push_back(tmp_orbitals[ti]);

             _phisb.push_back(tmp_orbitals[ti]);

             _eigsa[oi] = tmp_eigs[ti];

             _eigsb[oi] = tmp_eigs[ti];

           }

         }

       }

     }

     //*************************************************************************


     //*************************************************************************

     // Constructor

     Solver(World& world,

            const rfunctionT& vnucrhon,

            const vecfuncT& phis,

            const std::vector<T>& eigs,

            const ElectronicStructureParams& params,

            MolecularEntity mentity)

        : _world(world), _vnucrhon(vnucrhon), _phisa(phis), _phisb(phis),

        _eigsa(eigs), _eigsb(eigs), _params(params), _mentity(mentity)

     {

       _residual = 1e5;

       if (params.periodic)

       {

         Tensor<double> box = FunctionDefaults<NDIM>::get_cell_width();

         //_cop = PeriodicCoulombOpPtr<T,NDIM>(const_cast<World&>(world),

         //    FunctionDefaults<NDIM>::get_k(), params.lo, params.thresh * 0.1, box);

         _cop = CoulombOperatorPtr(const_cast<World&>(world), params.lo, params.thresh * 0.1);

       }

       else

       {

         _cop = CoulombOperatorPtr(const_cast<World&>(world), params.lo, params.thresh * 0.1);

       }


       if (params.ispotential)

       {

         _vnuc = copy(_vnucrhon);

       }

       else

       {

         _vnuc = apply(*_cop, _vnucrhon);

       }

     }

     //*************************************************************************


     //*************************************************************************

     // Constructor

     Solver(World& world,

            rfunctionT vnucrhon,

            vecfuncT phis,

            std::vector<T> eigs,

            std::vector<KPoint> kpoints,

            std::vector<double> occs,

            ElectronicStructureParams params,

            MolecularEntity mentity)

        : _world(world), _vnucrhon(vnucrhon), _phisa(phis), _phisb(phis),

          _eigsa(eigs), _eigsb(eigs), _params(params),

          _kpoints(kpoints), _occsa(occs), _occsb(occs), _mentity(mentity)

     {

       _residual = 1e5;

       if (params.periodic)

       {

         Tensor<double> box = FunctionDefaults<NDIM>::get_cell_width();

         _cop = CoulombOperatorPtr(const_cast<World&>(world), params.lo, params.thresh * 0.1);

       }

       else

       {

         _cop = CoulombOperatorPtr(const_cast<World&>(world), params.lo, params.thresh * 0.1);

       }


       if (params.ispotential)

       {

         _vnuc = copy(_vnucrhon);

       }

       else

       {

         _vnuc = apply(*_cop, _vnucrhon);

       }

     }

     //*************************************************************************


     //*************************************************************************

     virtual ~Solver()

     {

       _outputF.close();

       _matF.close();

       _eigF.close();

       delete _subspace;

     }

     //*************************************************************************


     //***************************************************************************

     // set occupation numbers (only for insulators ... no smearing)

     void set_occs2(const std::vector<KPoint>& kpoints,

                    const std::vector<double>& eigsa,

                    const std::vector<double>& eigsb,

                    std::vector<double>& occsa,

                    std::vector<double>& occsb)

     {

       for (unsigned int ik = 0; ik < kpoints.size(); ik++)

       {

         // get k-point

         KPoint k = kpoints[ik];


         // pull subset of data that corresponds to k

         const std::vector<double> k_eigsa(eigsa.begin() + k.begin, eigsa.begin() + k.end);

         const std::vector<double> k_eigsb(eigsb.begin() + k.begin, eigsb.begin() + k.end);

         std::vector<double> k_occsa(occsa.begin() + k.begin, occsa.begin() + k.end);

         std::vector<double> k_occsb(occsb.begin() + k.begin, occsb.begin() + k.end);


         // demand all vectors have the same size

         unsigned int sz = k_eigsa.size();

         MADNESS_ASSERT(k_eigsb.size() == sz);

         MADNESS_ASSERT(k_occsa.size() == sz);

         MADNESS_ASSERT(k_occsb.size() == sz);

         // concatenate eigenvalues

         std::vector<double> teigs;

         //std::copy(k_eigsa.begin(), k_eigsa.end(), teigs.begin());

         //teigs.insert(teigs.end(), k_eigsb.begin(), k_eigsb.end());

         //std::copy(k_eigsb.begin(), k_eigsb.end(), back_inserter(teigs));

         for (unsigned int ist = 0; ist < k_eigsa.size(); ist++) teigs.push_back(k_eigsa[ist]);

         for (unsigned int ist = 0; ist < k_eigsb.size(); ist++) teigs.push_back(k_eigsb[ist]);


         if (_world.rank() == 0) printf("setting occs ....\n\n");

         for (unsigned int ist = 0; ist < teigs.size(); ist++)

         {

           if (_world.rank() == 0)

           {

             printf("%5d    %15.8f\n", ist, teigs[ist]);

           }

         }


         // indicies

         std::vector<unsigned int> inds(2*sz);

         for (unsigned int i = 0; i < 2*sz; i++) inds[i] = i;

         // sort by eigenvalue

         for (unsigned int i = 0; i < 2*sz; i++)

         {

           for (unsigned int j = i+1; j < 2*sz; j++)

           {

             if (teigs[j] < teigs[i])

             {

               double t1 = teigs[i];

               teigs[i] = teigs[j];

               teigs[j] = t1;

               int it1 = inds[i];

               inds[i] = inds[j];

               inds[j] = it1;

             }

           }

         }


         if (_world.rank() == 0)

           printf("\nSorted eigenvalues:\n");

         for (unsigned int i = 0; i < teigs.size(); i++)

         {

           if (_world.rank() == 0)

             printf("%10d%10d     %15.8f\n",i,inds[i],teigs[i]);

         }


         // assign occupation numbers

         double availablecharge = _params.ncharge;

         for (unsigned int i = 0; (i < 2*sz) && (availablecharge > 0.0) ; i++)

         {

           unsigned int current = inds[i];

           if (current >= sz)

           {

             current -= sz;

             k_occsb[current] = 1.0;

             availablecharge -= 1.0;

           }

           else

           {

             k_occsa[current] = 1.0;

             availablecharge -= 1.0;

           }

         }


         for (unsigned int ik1 = k.begin, ik2 = 0; ik1 < k.end; ik1++,ik2++)

         {

           occsa[ik1] = k_occsa[ik2];

           occsb[ik1] = k_occsb[ik2];

         }

       }


       for (unsigned int ik = 0; ik < kpoints.size(); ik++)

       {

         KPoint k = kpoints[ik];

         if (_world.rank() == 0)

         {

           printf("k-point is: %d: \n",ik);

         }

         for (unsigned int ist = k.begin; ist < k.end; ist++)

         {

           if (_world.rank() == 0)

           {

             printf("occa:    %12.5f          occb:    %12.5f \n",occsa[ist],occsb[ist]);

           }

         }

       }


     }

     //***************************************************************************


     //***************************************************************************

     rfunctionT compute_rho_slow(const vecfuncT& phis, std::vector<KPoint> kpoints,

                                std::vector<double> occs)

     {

       // Electron density

       rfunctionT rho = rfactoryT(_world);

       _world.gop.fence();

       if (_world.rank() == 0) _outputF << "computing rho ..." << endl;

       // Loop over k-points

       for (unsigned int kp = 0; kp < kpoints.size(); kp++)

       {

         // get k-point

         KPoint kpoint = kpoints[kp];

         // loop through bands

         for (unsigned int j = kpoint.begin; j < kpoint.end; j++)

         {

           // Get phi(j) from iterator

           const functionT& phij = phis[j];

           // Compute the j-th density

           //rfunctionT prod = abs_square(phij);

           rfunctionT prod = abssq(phij,true);

           double rnrm = prod.trace();

           prod.scale(1/rnrm);

 //          rho += 0.5 * _occs[j] * kpoint.weight * prod;

           rho += occs[j] * kpoint.weight * prod;

         }

       }

       rho.truncate();


       return rho;

     }


     // computes the electronic density for 1 spin

     rfunctionT compute_rho(const vecfuncT& phis, std::vector<KPoint> kpoints,

                           std::vector<double> occs)

     {

       if (_world.rank() == 0) _outputF << "computing rho ..." << endl;

       rfunctionT rho = rfactoryT(_world);       // Electron density


       reconstruct(_world, phis); // For max parallelism

       std::vector<rfunctionT> phisq(phis.size());

       for (unsigned int i=0; i<phis.size(); i++) {

           phisq[i] = abssq(phis[i],false);

       }

       _world.gop.fence();

       std::vector<double> phinorm = norm2s(_world, phis);


       compress(_world,phisq); // since will be using gaxpy for accumulation

       rho.compress();


       // Loop over k-points

       for (unsigned int kp = 0; kp < kpoints.size(); kp++)

       {

         // get k-point

         KPoint kpoint = kpoints[kp];

         // loop through bands

         for (unsigned int j = kpoint.begin; j < kpoint.end; j++)

         {

           rho.gaxpy(1.0, phisq[j], occs[j] * kpoint.weight / (phinorm[j]*phinorm[j]), false);

         }

       }

       _world.gop.fence();

       phisq.clear();

       rho.truncate();


       return rho;

     }


     //***************************************************************************


     //***************************************************************************

     std::vector<poperatorT> make_bsh_operators(const std::vector<T>& eigs)

     {

       // Make BSH vector

       std::vector<poperatorT> bops;

       // Get defaults

       double tol = FunctionDefaults<NDIM>::get_thresh();

       // Loop through eigenvalues, adding a BSH operator to bops

       // for each eigenvalue

       int sz = eigs.size();

       for (int i = 0; i < sz; i++)

       {

           T eps = eigs[i];

           if (eps > 0)

           {

               if (_world.rank() == 0)

               {

                   std::cout << "bsh: warning: positive eigenvalue" << i << eps << endl;

               }

               eps = -0.1;

           }


           bops.push_back(poperatorT(BSHOperatorPtr3D(_world, sqrt(-2.0*eps), _params.lo, tol * 0.1)));

       }

       return bops;

     }

     //*************************************************************************


     //*************************************************************************

 //    void loadbal()

 //    {

 //        if(_world.size() == 1)

 //            return;

 //

 //        LoadBalanceDeux<3> lb(_world);

 //        lb.add_tree(_vnuc, lbcost<double,3>(1.0, 0.0), false);

 //        lb.add_tree(_rhoa, lbcost<double,3>(1.0, 1.0), false);

 //        for(unsigned int i = 0;i < _phisa.size();i++)

 //        {

 //            lb.add_tree(_phisa[i], lbcost<valueT,3>(1.0, 1.0), false);

 //        }

 //        if(_params.spinpol)

 //        {

 //            lb.add_tree(_rhob, lbcost<double,3>(1.0, 1.0), false);

 //            for(unsigned int i = 0;i < _phisb.size();i++)

 //            {

 //                lb.add_tree(_phisa[i], lbcost<valueT,3>(1.0, 1.0), false);

 //            }

 //        }

 //

 //        FunctionDefaults<3>::redistribute(_world, lb.load_balance(6.0));

 //   }

    //*************************************************************************


     //*************************************************************************

     double calculate_kinetic_energy()

     {

       double ke = 0.0;

       if (!_params.periodic)

       {

         complex_derivative_3d Dx(_world,0);

         complex_derivative_3d Dy(_world,1);

         complex_derivative_3d Dz(_world,2);

         for (unsigned int i = 0; i < _phisa.size(); i++)

         {

           functionT dpdx = Dx(_phisa[i]);

           functionT dpdy = Dy(_phisa[i]);

           functionT dpdz = Dz(_phisa[i]);

           ke += 0.5 * (real(inner(dpdx,dpdx)) + real(inner(dpdy,dpdy))

               + real(inner(dpdz,dpdz)));

         }

         if (_params.spinpol)

         {

           for (unsigned int i = 0; i < _phisb.size(); i++)

           {

             functionT dpdx = Dx(_phisb[i]);

             functionT dpdy = Dy(_phisb[i]);

             functionT dpdz = Dz(_phisb[i]);

             ke += 0.5 * (real(inner(dpdx,dpdx)) + real(inner(dpdy,dpdy))

                 + real(inner(dpdz,dpdz)));

           }

         }

         else

         {

           ke *= 2.0;

         }

       }

       return ke;

     }

     //*************************************************************************


     //*************************************************************************

     void apply_potential(vecfuncT& pfuncsa,

         vecfuncT& pfuncsb, const vecfuncT& phisa,

         const vecfuncT& phisb, const rfunctionT& rhoa, const rfunctionT& rhob,

         const rfunctionT& rho)

     {

       // Nuclear and coulomb potentials

       rfunctionT vc = apply(*_cop, rho);


       // combined density

       rfunctionT rho2 = rho + _vnucrhon;

       double vnucrhontrace = _vnucrhon.trace();

       double rhotrace = rho.trace();

       double rho2trace = rho2.trace();

       if (_world.rank() == 0) printf("_vnucrhon trace: %10e\n", vnucrhontrace);

       if (_world.rank() == 0) printf("rho trace: %10e\n", rhotrace);

       if (_world.rank() == 0) printf("rho2 trace: %10e\n", rho2trace);

       rfunctionT vlocal = (_params.ispotential) ? _vnuc + vc : apply(*_cop, rho2);

       rfunctionT vlocal2 = _vnuc + vc;

       double vlerr = (vlocal-vlocal2).norm2();

       if (_world.rank() == 0) printf("vlerr trace: %10e\n\n", vlerr);


       // Calculate energies for Coulomb and nuclear

       double ce = 0.5*inner(vc,rho);

       double pe = inner(_vnuc,rho);

       double xc = 0.0;

       double ke = calculate_kinetic_energy();

       // Exchange

       if (_params.functional == 1)

       {

         // LDA, is calculation spin-polarized?

         if (_params.spinpol)

         {

                 MADNESS_EXCEPTION("Spin polarized not implemented!",0);

 //          // potential

 //          rfunctionT vxca = binary_op(rhoa, rhob, &::libxc_ldaop_sp<double>);

 //          rfunctionT vxcb = binary_op(rhob, rhoa, &::libxc_ldaop_sp<double>);

 //          pfuncsa = mul_sparse(_world, vlocal + vxca, phisa, _params.thresh * 0.1);

 //          pfuncsb = mul_sparse(_world, vlocal + vxcb, phisb, _params.thresh * 0.1);

 //          // energy

 //          rfunctionT fca = binary_op(rhoa, rhob, &::libxc_ldaeop_sp<double>);

 //          rfunctionT fcb = binary_op(rhob, rhoa, &::libxc_ldaeop_sp<double>);

 //          xc = fca.trace() + fcb.trace();

         }

         else

         {

           // potential

           rfunctionT vxc = copy(rhoa);

 //          vxc.unaryop(&::libxc_ldaop<double>);

           START_TIMER(_world);

           vxc.unaryop(&::ldaop<double>);


           //test_periodicity(vc);

 //          for (unsigned int i = 0; i < phisa.size(); i++)

 //          {

 //            test_periodicity(phisa[i]);

 //          }


           pfuncsa = mul_sparse(_world, vlocal2+vxc, phisa, _params.thresh * 0.1);

 //          rfunctionT vxc2 = binary_op(rhoa, rhoa, &::libxc_ldaop_sp<double>);

 //          pfuncsa = mul_sparse(_world, vlocal + vxc2, phisa, _params.thresh * 0.1);


 //          for (unsigned int i = 0; i < pfuncsa.size(); i++)

 //          {

 //            test_periodicity(pfuncsa[i]);

 //          }


           END_TIMER(_world,"Applying LDA potential");

           // energy

           rfunctionT fc = copy(rhoa);

           fc.unaryop(&::ldaeop<double>);

           xc = fc.trace();

         }

       }

       else if (_params.functional == 2)

       {

         START_TIMER(_world);

         pfuncsa = mul_sparse(_world, vlocal, phisa, _params.thresh * 0.1);

         END_TIMER(_world,"Applying local potential");

         START_TIMER(_world);

         // gamma-point?

         if ((_params.ngridk0 == 1) && (_params.ngridk1 == 1) && (_params.ngridk2 == 1))

         {

           apply_hf_exchange3(_phisa, _phisb, pfuncsa, pfuncsb, xc);

         }

         else

         {

           apply_hf_exchange4(_phisa, _phisb, pfuncsa, pfuncsb, xc);

         }

         END_TIMER(_world, "Applying HF exchange");

       }

       std::cout.precision(8);

       if (_world.rank() == 0)

       {

         printf("Energies:\n");

         printf("Kinetic energy:     %20.10f\n", ke);

         printf("Potential energy:   %20.10f\n", pe);

         printf("Coulomb energy:     %20.10f\n", ce);

         printf("Exchange energy:    %20.10f\n", xc);

         printf("Total energy:       %20.10f\n\n", ke + pe + ce + xc);

       }

     }

     //*************************************************************************


     // working for a molecule / atom ... need to test with periodic boundary

     // conditions as a gamma point only calculation

     //*************************************************************************

 //    void apply_hf_exchange2(vecfuncT& phisa, vecfuncT& phisb,

 //                           vecfuncT& funcsa, vecfuncT& funcsb,

 //                           double& xc)

 //    {

 //      Vector<double,3> q = vec(0.0,0.0,0.0);

 //      SeparatedConvolution<double_complex,3> hfexop =

 //          PeriodicHFExchangeOperator(_world, q, _params.lo,

 //              FunctionDefaults<3>::get_thresh() * 0.1);

 //      for (unsigned int i = 0; i < phisa.size(); i++)

 //      {

 //        bool isreal1 = is_real<T,NDIM>(phisa[i]);

 //        MADNESS_ASSERT(isreal1);

 //        for (unsigned int j = 0; j < phisa.size(); j++)

 //        {

 //          bool isreal2 = is_real<T,NDIM>(phisa[j]);

 //          MADNESS_ASSERT(isreal2);

 //          functionT prod = phisa[i]*phisa[j];

 //          prod.truncate();

 //          rfunctionT Vex = real(apply(hfexop,prod));

 //          functionT tf1 = Vex*phisa[j];

 //          funcsa[i] -= tf1;

 //          xc -= real(inner(phisa[i],tf1));

 //        }

 //      }

 //    }

     //*************************************************************************


     // working for a molecule / atom ... works for a gamma point calculation

     //*************************************************************************

     void apply_hf_exchange3(vecfuncT& phisa, vecfuncT& phisb,

                             vecfuncT& funcsa, vecfuncT& funcsb,

                             double& xc)

     {

       for (unsigned int j = 0; j < phisa.size(); j++)

       {

         rfunctionT phi_j = real(phisa[j]);

         // do diagonal piece first

         rfunctionT dprod = phi_j*phi_j;

         dprod.truncate();

         rfunctionT dVex = apply(*_cop,dprod);

         functionT tf_jjj = dVex*phisa[j];

         funcsa[j] -= tf_jjj;

         xc -= real(inner(phisa[j],tf_jjj));

         for (unsigned int i = j+1; i < phisa.size(); i++)

         {

           rfunctionT phi_i = real(phisa[i]);

           rfunctionT prod = phi_i*phi_j;

           prod.truncate();

           rfunctionT Vex = apply(*_cop,prod);

           // do the jij-th term

           functionT tf_jij = Vex*phisa[j];

           funcsa[i] -= tf_jij;

           xc -= real(inner(phisa[i],tf_jij));

           // do the iji-th term (in the complex case, use the complex

           // conjugate)

           functionT tf_iji = Vex*phisa[i];

           funcsa[j] -= tf_iji;

           xc -= real(inner(phisa[j],tf_iji));

         }

       }

     }

     //*************************************************************************


     //*************************************************************************

     KPoint find_kpt_from_orb(unsigned int idx)

     {

       for (unsigned int i = 0; i < _kpoints.size(); i++)

       {

         KPoint k1 = _kpoints[i];

         if (k1.is_orb_in_kpoint(idx)) return k1;

       }

       MADNESS_EXCEPTION("Error: find_kpt_from_orb: didn't find kpoint\n", 0);

     }

     //************************************************************************


     // hf exchange with k-points for periodic solid

     //*************************************************************************

     void apply_hf_exchange4(vecfuncT& phisa, vecfuncT& phisb,

                            vecfuncT& funcsa, vecfuncT& funcsb,

                            double& xc)

     {

       for (unsigned int i = 0; i < phisa.size(); i++)

       {

         functionT phi_i = phisa[i];

         KPoint k_i = find_kpt_from_orb(i);

         for (unsigned int j = 0; j < phisa.size(); j++)

         {

           functionT phi_j = phisa[j];

           KPoint k_j = find_kpt_from_orb(j);

           Vector<double,3> q = vec((k_i.k[0]-k_j.k[0])*_params.L,

                                    (k_i.k[1]-k_j.k[1])*_params.L,

                                    (k_i.k[2]-k_j.k[2])*_params.L);

           Vector<double,3> q2 = vec(k_i.k[0]-k_j.k[0],

                                     k_i.k[1]-k_j.k[1],

                                     k_i.k[2]-k_j.k[2]);

           functionT cexp =

               factoryT(_world).functor(functorT(new

                   ComplexExp<3>(q2, double_complex(1.0,0.0))));

           functionT cexp2 = conj(cexp);

           cexp.truncate();

           cexp2.truncate();

           functionT prod = phi_i*phi_j*cexp;

           SeparatedConvolution<double_complex,3> hfexop =

               PeriodicHFExchangeOperator(_world, q, _params.lo,

                   FunctionDefaults<3>::get_thresh() * 0.1);

           functionT Vex = apply(hfexop,prod);

           functionT tf1 = Vex*phisa[j]*cexp2;

           funcsa[i] -= tf1;

           xc -= real(inner(phisa[i],tf1));

         }

       }

     }

     //*************************************************************************


     // not working and not tested .... supposed to be for the periodic boundary

     // conditions with k-points

     //*************************************************************************

     void apply_hf_exchange(vecfuncT& phisa, vecfuncT& phisb,

                            vecfuncT& funcsa, vecfuncT& funcsb)

     {

       for (unsigned int ink1 = 0, ik1 = 0; ink1 < _phisa.size(); ++ink1)

       {

         for (unsigned int ink2 = 0, ik2 = 0; ink2 <= ink1; ink2++)

         {

           KPoint k1 = _kpoints[ik1];

           KPoint k2 = _kpoints[ik2];


           if (ink1 == k1.end) ik1++;

           if (ink2 == k2.end) ik2++;


           MADNESS_ASSERT(ik1 == 0);

           MADNESS_ASSERT(ik2 == 0);


           // no phase factor

           if (ik1 == ik2)

           {

 //            // same state (diagonal piece)

 //            if (ink1 == ink2)

 //            {

 //              rfunctionT prod = abs_square(phisa[ink1]);

 //              rfunctionT fr = apply(*_cop,prod);

 //              funcsa[ink1] -= funcsa[ink1]*fr;

 //            }

 //            else

             {

               Vector<double,3> q = 0.0;

               functionT f = phisa[ink1]*conj(phisa[ink2]);

               SeparatedConvolution<double_complex,3> hfexop =

                   PeriodicHFExchangeOperator(_world, q, _params.lo, FunctionDefaults<3>::get_thresh() * 0.1);

               functionT fr = apply(hfexop,f);

               funcsa[ink1] -= funcsa[ink2]*fr;

               funcsa[ink2] -= funcsa[ink1]*conj(fr);


               // test code

               rfunctionT g1 = abs(phisa[ink1]);

               rfunctionT g2 = abs(phisa[ink2]);

               rfunctionT ff = g1*g2;


               printf("norm diff: %20.8f\n", abs(ff.norm2()-f.norm2()));

               MADNESS_ASSERT(abs(ff.norm2()-f.norm2()) <= 1e-5);

               rfunctionT fr2 = apply(*_cop,ff);

               MADNESS_ASSERT(abs(fr.norm2()-fr2.norm2()) <= 1e-5);

             }

           }

 //          else

 //          {

 //            Vector<double,3> q = VectorFactory(k1.k[0]-k2.k[0],

 //                                               k1.k[1]-k2.k[1],

 //                                               k1.k[2]-k2.k[2]);

 //            functionT cexp = factoryT(_world).functor(functorT(new ComplexExp<3>(q, double_complex(1.0,0.0))));

 //            cexp.truncate();

 //

 //            functionT f = phisa[ink1]*conj(phisa[ink2])*cexp;

 //            SeparatedConvolution<double_complex,3> hfexop =

 //                PeriodicHFExchangeOperator(_world, q, _params.lo, FunctionDefaults<3>::get_thresh() * 0.1);

 //            functionT fr = apply(hfexop,f);

 //            funcsa[ink1] -= phisa[ink1]*fr*conj(cexp);

 //            funcsa[ink2] -= phisa[ink2]*conj(fr)*cexp;

 //          }

         }

       }

     }

     //*************************************************************************


     //*************************************************************************

     void reproject()

     {

       _params.waveorder += 2;

       _params.thresh /= 100;

       FunctionDefaults<3>::set_thresh(_params.thresh);

       FunctionDefaults<3>::set_k(_params.waveorder);

       if (_world.rank() == 0) _outputF << "reprojecting to wavelet order "

           << _params.waveorder << endl;

       reconstruct(_world, _phisa);

       for(unsigned int i = 0; i < _phisa.size(); i++)

       {

         _phisa[i] = madness::project(_phisa[i], FunctionDefaults<3>::get_k(),

           FunctionDefaults<3>::get_thresh(), false);

       }

       _world.gop.fence();

       truncate(_world, _phisa);

       normalize(_world, _phisa);

       if(_params.spinpol)

       {

         reconstruct(_world, _phisb);

         for(unsigned int i = 0; i < _phisb.size(); i++)

         {

             _phisb[i] = madness::project(_phisb[i], FunctionDefaults<3>::get_k(),

               FunctionDefaults<3>::get_thresh(), false);

         }

         _world.gop.fence();

         truncate(_world, _phisb);

         normalize(_world, _phisb);

       }


       delete _cop;

       make_nuclear_potential();

       //_subspace->reproject();

       delete _subspace;

       _subspace = new Subspace<T,NDIM>(_world, _params);

     }

     //*************************************************************************


     //*************************************************************************

     void solve()

     {


       // WSTHORNTON (debug) Test periodicity

 //      if (_world.rank() == 0) printf("initial orbitals (periodicity) ...\n\n");

 //      for (unsigned int i = 0; i < _phisa.size(); i++)

 //      {

 //        if (_world.rank() == 0) printf("orbital %d\n",i);

 //        test_periodicity(_phisa[i]);

 //        if (_world.rank() == 0) printf("\n\n");

 //      }

 //      if (_world.rank() == 0) printf("\n\n\n\n");


       if (_world.rank() == 0) print("size of phisa is:  ", _phisa.size());

       // keep track of how many iterations have gone by without reprojecting

       int rit = 0;

       int rpthresh = 20;

       for (_it = 0; _it < _params.maxits && _residual > _params.rcriterion; _it++, rit++)

       {

         // should we reproject?

         if ((_it > 0) && ((_residual < 20*_params.thresh) || (rit == rpthresh)))

         {

           // reproject orbitals and reset threshold

           reproject();

           rit = 0;

         }


         if (_world.rank() == 0) _outputF << "_it = " << _it << endl;


         // Set occupation numbers

         set_occs2(_kpoints,_eigsa,_eigsb,_occsa,_occsb);


         // Compute density

         rfunctionT rhoa = compute_rho(_phisa, _kpoints, _occsa);

         rfunctionT rhob = (_params.spinpol) ? compute_rho(_phisb, _kpoints, _occsb) : rhoa;

 //        rfunctionT rhoa = _rhoa;

 //        rfunctionT rhob = _rhob;

         double drhoa = (_rhoa-rhoa).trace();

         double drhob = (_rhob-rhob).trace();

         if (_world.rank() == 0)

         {

           printf("diff of alpha rho: %15.7f\n",drhoa);

           printf("diff of beta rho: %15.7f\n",drhob);

         }


         _rho = rhoa + rhob;


         _rhoa = rhoa;

         _rhob = rhob;

         double rtrace = _rho.trace();

         if (_world.rank() == 0) _outputF << "trace of rho" << rtrace << endl;


 //        if(_it < 2 || (_it % 10) == 0)

 //        {

 //          START_TIMER(_world);

 //          //loadbal();

 //          END_TIMER(_world, "Load balancing");

 //        }


         std::vector<functionT> pfuncsa =

                 zero_functions<valueT,NDIM>(_world, _phisa.size());

         std::vector<functionT> pfuncsb =

                 zero_functions<valueT,NDIM>(_world, _phisb.size());


         // Apply the potentials to the orbitals

         if (_world.rank() == 0) _outputF << "applying potential ...\n" << endl;

         //START_TIMER(_world);

         apply_potential(pfuncsa, pfuncsb, _phisa, _phisb, _rhoa, _rhob, _rho);

         //END_TIMER(_world,"apply potential");


         // Do right hand side for all k-points

         std::vector<double> alpha(pfuncsa.size(), 0.0);

         do_rhs_simple(_phisa, pfuncsa, _kpoints, alpha, _eigsa);


         if (_params.plotorbs)

         {

           std::vector<long> npt(3,101);

           for (unsigned int ik = 0; ik < _kpoints.size(); ik++)

           {

             KPoint kpoint = _kpoints[ik];

             int ist = 0;

             for (unsigned int kst = kpoint.begin; kst < kpoint.end; kst++, ist++)

             {

               std::ostringstream strm;

               strm << "pre_unk_" << ik << "_" << ist << ".dx";

               std::string fname = strm.str();

               plotdx(_phisa[kst], fname.c_str(), FunctionDefaults<3>::get_cell(), npt);

             }

           }

         }

         // WSTHORNTON

         // DEBUG

         if (_world.rank() == 0)

           printf("\n\n\n\n------ Debugging BSH operator -----");

         for (unsigned int ik = 0; ik < _kpoints.size(); ik++)

         {

           KPoint kpoint = _kpoints[ik];

           std::vector<double> k_alpha(alpha.begin() + kpoint.begin, alpha.begin() + kpoint.end);

           if (_world.rank() == 0)

             printf("alpha: (%6.4f,%6.4f,%6.4f)\n",kpoint.k[0],kpoint.k[1],kpoint.k[2]);

           for (unsigned int ia = 0; ia < k_alpha.size(); ia++)

           {

             if (_world.rank() == 0) printf("%15.8f\n", k_alpha[ia]);

           }

         }

         if (_world.rank() == 0) printf("\n\n\n\n");


         // WSTHORNTON (debug)

         if (_world.rank() == 0) printf("before BSH application ...\n\n");

         for (unsigned int ik = 0; ik < _kpoints.size(); ik++)

         {

           KPoint kpoint = _kpoints[ik];

           double k0 = kpoint.k[0];

           double k1 = kpoint.k[1];

           double k2 = kpoint.k[2];

           if (_world.rank() == 0)

             printf("(%6.5f, %6.5f, %6.5f)\n",k0,k1,k2);

           std::vector<functionT> k_phisa(_phisa.begin() + kpoint.begin, _phisa.begin() + kpoint.end);

           std::vector<functionT> k_pfuncsa(pfuncsa.begin() + kpoint.begin, pfuncsa.begin() + kpoint.end);

           KPoint kpoint_gamma;

           print_fock_matrix_eigs(k_phisa, k_pfuncsa, kpoint_gamma);


           // diagonalize overlap

           tensorT overlap = matrix_inner(_world,k_pfuncsa,k_pfuncsa,true);

           ctensorT co; rtensorT eo;

           syev(overlap, co, eo);


           if (_world.rank() == 0) printf("Overlap eigenvalues: \n");

           if (_world.rank() == 0) print(overlap);

           for (unsigned int ie = 0; ie < eo.dim(0); ie++)

           {

             if (_world.rank() == 0) printf("%d    %15.8e\n", ie, eo(ie,ie));

           }


         }

         if (_world.rank() == 0) printf("\n\n\n\n");


         // WSTHORNTON (debug) Test periodicity

 //        if (_world.rank() == 0) printf("before BSH application (periodicity) ...\n\n");

 //        for (unsigned int i = 0; i < _phisa.size(); i++)

 //        {

 //          if (_world.rank() == 0) printf("orbital %d\n",i);

 //          test_periodicity(_phisa[i]);

 //          if (_world.rank() == 0) printf("\n\n");

 //        }

 //        if (_world.rank() == 0) printf("\n\n\n\n");


         // Make BSH Green's function

         std::vector<poperatorT> bopsa = make_bsh_operators(alpha);

         std::vector<T> sfactor(pfuncsa.size(), -2.0);

         scale(_world, pfuncsa, sfactor);


         // Apply Green's function to orbitals

         if (_world.rank() == 0) std::cout << "applying BSH operator ...\n" << endl;

         truncate<valueT,NDIM>(_world, pfuncsa);

         START_TIMER(_world);

         std::vector<functionT> tmpa = apply(_world, bopsa, pfuncsa);

         END_TIMER(_world,"apply BSH");

         bopsa.clear();


         // WSTHORNTON

         // norms

         if (_world.rank() == 0) printf("norms of tmpa\n");

         std::vector<double> tmpa_norms = norm2s(_world, tmpa);

         for (unsigned int i = 0; i < tmpa_norms.size(); i++)

         {

           if (_world.rank() == 0) printf("%10d     %15.8f\n", i, tmpa_norms[i]);

         }

         if (_world.rank() == 0) printf("\n\n\n\n");


         // Do other spin

         vecfuncT tmpb = zero_functions<valueT,NDIM>(_world, _phisb.size());

         if (_params.spinpol)

         {

           alpha = std::vector<double>(_phisb.size(), 0.0);

           do_rhs_simple(_phisb, pfuncsb,  _kpoints, alpha, _eigsb);

           std::vector<poperatorT> bopsb = make_bsh_operators(alpha);

           scale(_world, pfuncsb, sfactor);

           truncate<valueT,NDIM>(_world, pfuncsb);

           tmpb = apply(_world, bopsb, pfuncsb);

           bopsb.clear();

         }

         else

         {

           for (unsigned int i = 0; i < _eigsa.size(); i++) _eigsb[i] = _eigsa[i];

         }


         // WSTHORNTON (debug)

         std::vector<functionT> pfuncsa2=

                 zero_functions<valueT,NDIM>(_world, _phisa.size());

         std::vector<functionT> pfuncsb2=

                 zero_functions<valueT,NDIM>(_world, _phisa.size());


         // Apply the potentials to the orbitals

         if (_world.rank() == 0) _outputF << "applying potential2 ...\n" << endl;

         apply_potential(pfuncsa2, pfuncsb2, tmpa, tmpb, _rhoa, _rhob, _rho);

         for (unsigned int ik = 0; ik < _kpoints.size(); ik++)

         {

           KPoint kpoint = _kpoints[ik];

           double k0 = kpoint.k[0];

           double k1 = kpoint.k[1];

           double k2 = kpoint.k[2];

           if (_world.rank() == 0)

             printf("(%6.5f, %6.5f, %6.5f)\n",k0,k1,k2);

           std::vector<functionT> k_tmpa(tmpa.begin() + kpoint.begin, tmpa.begin() + kpoint.end);

           std::vector<functionT> k_pfuncsa2(pfuncsa2.begin() + kpoint.begin, pfuncsa2.begin() + kpoint.end);

           print_fock_matrix_eigs(k_tmpa, k_pfuncsa2, kpoint);


           // diagonalize overlap

 //          tensorT overlap = matrix_inner(_world,k_tmpa,k_tmpa,true);

 //          if (_world.rank() == 0) print(overlap);

 //          ctensorT co; rtensorT eo;

 //          syev(overlap, co, eo);

 //

 //          if (_world.rank() == 0) printf("Overlap eigenvalues: \n");

 //          for (unsigned int ie = 0; ie < eo.dim(0); ie++)

 //          {

 //            if (_world.rank() == 0) printf("%d    %15.8e\n", ie, eo(ie,ie));

 //          }

         }

         if (_world.rank() == 0) printf("\n\n\n\n");


         if (_world.rank() == 0) printf("\n\n\n\n");


         // Update orbitals

         update_orbitals(tmpa, tmpb, _kpoints);

         save_orbitals();


         // WSTHORNTON

         if (_world.rank() == 0) _outputF << "after update_orbitals() ...\n" << endl;

         pfuncsa2=zero_functions<valueT,NDIM>(_world, _phisa.size());

         pfuncsb2=zero_functions<valueT,NDIM>(_world, _phisa.size());

         apply_potential(pfuncsa2, pfuncsb2, _phisa, _phisb, _rhoa, _rhob, _rho);

         for (unsigned int ik = 0; ik < _kpoints.size(); ik++)

         {

           KPoint kpoint = _kpoints[ik];

           double k0 = kpoint.k[0];

           double k1 = kpoint.k[1];

           double k2 = kpoint.k[2];

           if (_world.rank() == 0)

             printf("(%6.5f, %6.5f, %6.5f)\n",k0,k1,k2);

           std::vector<functionT> k_phisa(_phisa.begin() + kpoint.begin, _phisa.begin() + kpoint.end);

           std::vector<functionT> k_pfuncsa2(pfuncsa2.begin() + kpoint.begin, pfuncsa2.begin() + kpoint.end);

           print_fock_matrix_eigs(k_phisa, k_pfuncsa2, kpoint);

         }

         if (_world.rank() == 0) printf("\n\n\n\n");


       }


       if (_params.plotorbs)

       {

         std::vector<long> npt(3,101);

         for (unsigned int ik = 0; ik < _kpoints.size(); ik++)

         {

           KPoint kpoint = _kpoints[ik];

           int ist = 0;

           for (unsigned int kst = kpoint.begin; kst < kpoint.end; kst++, ist++)

           {

             std::ostringstream strm;

             strm << "unk_" << ik << "_" << ist << ".dx";

             std::string fname = strm.str();

             plotdx(_phisa[kst], fname.c_str(), FunctionDefaults<3>::get_cell(), npt);

           }

         }

       }

       save_orbitals();

     }

     //*************************************************************************


     //*************************************************************************

     ctensorT matrix_exponential(const ctensorT& A) {

         const double tol = 1e-13;

         MADNESS_ASSERT(A.dim(0) == A.dim(1));


         // Scale A by a power of 2 until it is "small"

         double anorm = A.normf();

         int n = 0;

         double scale = 1.0;

         while (anorm*scale > 0.1)

         {

             n++;

             scale *= 0.5;

         }

         tensorT B = scale*A;    // B = A*2^-n


         // Compute exp(B) using Taylor series

         ctensorT expB = ctensorT(2, B.dims());

         for (int i = 0; i < expB.dim(0); i++) expB(i,i) = std::complex<T>(1.0,0.0);


         int k = 1;

         ctensorT term = B;

         while (term.normf() > tol)

         {

             expB += term;

             term = inner(term,B);

             k++;

             term.scale(1.0/k);

         }


         // Repeatedly square to recover exp(A)

         while (n--)

         {

             expB = inner(expB,expB);

         }


         return expB;

     }

     //*************************************************************************


     //*************************************************************************

     template<typename Q>

     void print_tensor2d(ostream& os, Tensor<Q> t)

     {

       os.precision(5);

       for (int i = 0; i < t.dim(0); i++)

       {

         for (int j = 0; j < t.dim(1); j++)

         {

           os << t(i,j) << setw(12);

         }

         os << endl;

       }

       os << endl;

     }

     //*************************************************************************


     //*************************************************************************

     void print_potential_matrix_eigs(const vecfuncT& wf, const vecfuncT& vwf)

     {

       // Build the potential matrix

       START_TIMER(_world);

       tensorT potential = matrix_inner(_world, wf, vwf, true);

       _world.gop.fence();

       END_TIMER(_world,"potential energy matrix");

       if (_world.rank()==0) printf("\n");

       tensorT overlap = matrix_inner(_world,wf,wf,true);

       _world.gop.fence();


       // diagonalize potential

       ctensorT cp; rtensorT ep;

       sygv(potential, overlap, 1, cp, ep);

       if (_world.rank() == 0)

       {

         print("potential eigenvectors dims:",cp.dim(0),cp.dim(1));

         print("potential eigenvectors:");

         print(cp);

         printf("\n\n");

         print("potential eigenvalues:");

         print(ep);

         printf("\n\n");

       }


     }

     //*************************************************************************


     //*************************************************************************

     void print_fock_matrix_eigs(const vecfuncT& wf, const vecfuncT& vwf, KPoint kpoint)

     {

       // Build the potential matrix

       START_TIMER(_world);

       tensorT potential = matrix_inner(_world, wf, vwf, true);

       _world.gop.fence();

       END_TIMER(_world,"potential energy matrix");

       if (_world.rank()==0) printf("\n");


       START_TIMER(_world);

       if (_world.rank() == 0) _outputF << "Building kinetic energy matrix ...\n\n" << endl;

         //tensorT kinetic = ::kinetic_energy_matrix_slow<T,NDIM>(_world, psi,

         //                                          _params.periodic,

         //                                          kpoint);

         tensorT kinetic = ::kinetic_energy_matrix<T,NDIM>(_world, wf,

                                                   _params.periodic,

                                                   kpoint);

       _world.gop.fence();

       END_TIMER(_world,"kinetic energy matrix");

       if (_world.rank() == 0) printf("\n");


       if (_world.rank() == 0) _outputF << "Constructing Fock matrix ...\n\n" << endl;

       tensorT fock = potential + kinetic;

       fock = 0.5 * (fock + conj_transpose(fock));

       _world.gop.fence();


       // DEBUG

       tensorT overlap = matrix_inner(_world,wf,wf,true);

       _world.gop.fence();


       // diagonlize kinetic

       ctensorT ck; rtensorT ek;

       sygv(kinetic, overlap, 1, ck, ek);

       // diagonalize potential

       ctensorT cp; rtensorT ep;

       sygv(potential, overlap, 1, cp, ep);

       // diagonalize overlap

       ctensorT co; rtensorT eo;

       syev(overlap, co, eo);

       ctensorT c; rtensorT e;

       sygv(fock, overlap, 1, c, e);


       if (_world.rank() == 0)

       {

         print("kinetic matrix:");

         print(kinetic);

         print("\nkinetic eigenvalues:");

         print(ek);

         print("\n");


         print("potential matrix:");

         print(potential);

         print("\npotential eigenvalues:");

         print(ep);

         print("\n");


         print("fock matrix:");

         print(fock);

         print("\nfock eigenvalues:");

         print(e);

         print("\n");

       }


     }

     //*************************************************************************


     //*************************************************************************

     void do_rhs(vecfuncT& wf,

                 vecfuncT& vwf,

                 std::vector<KPoint> kpoints,

                 std::vector<T>& alpha,

                 std::vector<double>& eigs)

     {

       // tolerance

       double trantol = 0.1*_params.thresh/std::min(30.0,double(wf.size()));

       double thresh = 1e-4;


       if (_world.rank() == 0) _eigF << "Iteration: " << _it << endl;

       for (unsigned int kp = 0; kp < kpoints.size(); kp++)

       {

         // Get k-point and orbitals for this k-point

         KPoint kpoint = kpoints[kp];

         double k0 = kpoint.k[0];

         double k1 = kpoint.k[1];

         double k2 = kpoint.k[2];

         // Extract the relevant portion of the list of orbitals and the list of the

         // V times the orbitals

         vecfuncT k_wf(wf.begin() + kpoint.begin, wf.begin() + kpoint.end);

         vecfuncT k_vwf(vwf.begin() + kpoint.begin, vwf.begin() + kpoint.end);

         // Build fock matrix

         tensorT fock = build_fock_matrix(k_wf, k_vwf, kpoint);

         tensorT overlap = matrix_inner(_world, k_wf, k_wf, true);


 //        // Do right hand side stuff for kpoint

 //        bool isgamma = (is_equal(k0,0.0,1e-5) &&

 //                        is_equal(k1,0.0,1e-5) &&

 //                        is_equal(k2,0.0,1e-5));

 //        if (_params.periodic && !isgamma) // Non-zero k-point

 //        {

 //          // Do the gradient term and k^2/2

 //          vecfuncT d_wf = zero_functions<valueT,NDIM>(_world, k_wf.size());

 //          complex_derivative_3d Dx(_world,0);

 //          complex_derivative_3d Dy(_world,1);

 //          complex_derivative_3d Dz(_world,2);

 //          for (unsigned int i = 0; i < k_wf.size(); i++)

 //          {

 //            // gradient

 //            functionT dx_wf = Dx(k_wf[i]);

 //            functionT dy_wf = Dy(k_wf[i]);

 //            functionT dz_wf = Dz(k_wf[i]);

 //            d_wf[i] = std::complex<T>(0.0,k0)*dx_wf +

 //                      std::complex<T>(0.0,k1)*dy_wf +

 //                      std::complex<T>(0.0,k2)*dz_wf;

 //            // k^/2

 //            double ksq = k0*k0 + k1*k1 + k2*k2;

 //            k_vwf[i] += 0.5 * ksq * k_wf[i];

 //            k_vwf[i] -= d_wf[i];

 //          }

 //        }


         if (_params.canon) // canonical orbitals

         {

           ctensorT U; rtensorT e;

           sygv(fock, overlap, 1, U, e);


           unsigned int nmo = k_wf.size();

           // Fix phases.

           long imax;

           for (long j = 0; j < nmo; j++)

           {

               // Get index of largest value in column

               U(_,j).absmax(&imax);

               T ang = arg(U(imax,j));

               std::complex<T> phase = exp(std::complex<T>(0.0,-ang));

               // Loop through the rest of the column and divide by the phase

               for (long i = 0; i < nmo; i++)

               {

                 U(i,j) *= phase;

               }

           }


           // Within blocks with the same occupation number attempt to

           // keep orbitals in the same order (to avoid confusing the

           // non-linear solver).  Have to run the reordering multiple

           // times to handle multiple degeneracies.

           int maxpass = 5;

           for (int pass = 0; pass < maxpass; pass++)

           {

               long j;

               for (long i = 0; i < nmo; i++)

               {

                 U(_, i).absmax(&j);

                 if (i != j)

                 {

                   tensorT tmp = copy(U(_, i));

                   U(_, i) = U(_, j);

                   U(_, j) = tmp;

                   //swap(e[i], e[j]);

                   T ti = e[i];

                   T tj = e[j];

                   e[i] = tj; e[j] = ti;

                 }

               }

           }


           // Rotations between effectively degenerate states confound

           // the non-linear equation solver ... undo these rotations

           long ilo = 0; // first element of cluster

           while (ilo < nmo-1) {

               long ihi = ilo;

               while (fabs(real(e[ilo]-e[ihi+1])) < thresh*10.0*max(fabs(real(e[ilo])),1.0)) {

                   ihi++;

                   if (ihi == nmo-1) break;

               }

               long nclus = ihi - ilo + 1;

               if (nclus > 1) {

                   if (_world.rank() == 0) print("   found cluster", ilo, ihi);

                   tensorT q = copy(U(Slice(ilo,ihi),Slice(ilo,ihi)));

                   //print(q);

                   // Special code just for nclus=2

                   // double c = 0.5*(q(0,0) + q(1,1));

                   // double s = 0.5*(q(0,1) - q(1,0));

                   // double r = sqrt(c*c + s*s);

                   // c /= r;

                   // s /= r;

                   // q(0,0) = q(1,1) = c;

                   // q(0,1) = -s;

                   // q(1,0) = s;


                   // Iteratively construct unitary rotation by

                   // exponentiating the antisymmetric part of the matrix

                   // ... is quadratically convergent so just do 3

                   // iterations

                   ctensorT rot = matrix_exponential(-0.5*(q - conj_transpose(q)));

                   q = inner(q,rot);

                   ctensorT rot2 = matrix_exponential(-0.5*(q - conj_transpose(q)));

                   q = inner(q,rot2);

                   ctensorT rot3 = matrix_exponential(-0.5*(q - conj_transpose(q)));

                   q = inner(rot,inner(rot2,rot3));

                   U(_,Slice(ilo,ihi)) = inner(U(_,Slice(ilo,ihi)),q);

               }

               ilo = ihi+1;

           }


           // Debug output

           if (_params.print_matrices && _world.rank() == 0)

           {

               printf("(%10.5f, %10.5f, %10.5f)\n", k0, k1, k2);

               print("Overlap matrix:");

               print(overlap);


               print("Fock matrix:");

               print(fock);


               print("U matrix: (eigenvectors)");

               print(U);


               print("Fock matrix eigenvalues:");

               print(e);

           }


           // WSTHORNTON

           //print_fock_matrix_eigs(k_wf, k_vwf, kpoint);


           // transform orbitals and V * (orbitals)

           //k_vwf = transform(_world, k_vwf, U, 1e-5 / std::min(30.0, double(k_wf.size())), false);

           //k_wf = transform(_world, k_wf, U, FunctionDefaults<3>::get_thresh() / std::min(30.0, double(k_wf.size())), true);


           // WSTHORNTON

           //print_fock_matrix_eigs(k_wf, k_vwf, kpoint);


           // Do right hand side stuff for kpoint

           bool isgamma = (is_equal(k0,0.0,1e-5) &&

                           is_equal(k1,0.0,1e-5) &&

                           is_equal(k2,0.0,1e-5));

           if (_params.periodic && !isgamma) // Non-zero k-point

           {

             // Do the gradient term and k^2/2

             vecfuncT d_wf = zero_functions<valueT,NDIM>(_world, k_wf.size());

             complex_derivative_3d Dx(_world,0);

             complex_derivative_3d Dy(_world,1);

             complex_derivative_3d Dz(_world,2);

             for (unsigned int i = 0; i < k_wf.size(); i++)

             {

               // gradient

               functionT dx_wf = Dx(k_wf[i]);

               functionT dy_wf = Dy(k_wf[i]);

               functionT dz_wf = Dz(k_wf[i]);

               d_wf[i] = std::complex<T>(0.0,k0)*dx_wf +

                         std::complex<T>(0.0,k1)*dy_wf +

                         std::complex<T>(0.0,k2)*dz_wf;

               // k^/2

               double ksq = k0*k0 + k1*k1 + k2*k2;

               k_vwf[i] += 0.5 * ksq * k_wf[i];

               k_vwf[i] -= d_wf[i];

             }

           }


           // WSTHORNTON (new code)

           unsigned int eimax = -1;

           double eimaxval = -1e10;

           for (unsigned int ei = kpoint.begin, fi = 0; ei < kpoint.end;

             ei++, fi++)

           {

             if ((real(e(fi,fi)) > 0.0) && (real(e(fi,fi)) > eimaxval))

             {

               eimax = fi;

               eimaxval = real(e(fi,fi));

             }

           }


           double eshift = (eimaxval > 0.0) ? eimaxval + 0.1 : 0.0;

           for (unsigned int ei = kpoint.begin, fi = 0; ei < kpoint.end;

             ei++, fi++)

           {

             // Save the latest eigenvalues

             eigs[ei] = real(e(fi,fi));

             alpha[ei] = e(fi,fi)-eshift;

             k_vwf[fi] += (alpha[ei]-eigs[ei])*k_wf[fi];

           }


           if (_world.rank() == 0)

           {

             _eigF << "kpt: " << kp << endl;

             _eigF << setfill('-') << setw(20) << " " << endl;

             for (unsigned int ei = kpoint.begin; ei < kpoint.end; ei++)

             {

               char eigstr[50];

               printf("%3d%15.10f",ei,real(eigs[ei]));

 //              _eigF << ei << setfill(' ') << setw(12) << real(eigs[ei]) << endl;

               _eigF << eigstr << endl;

             }

             _eigF << "\n\n" << endl;

           }

         }

         else // non-canonical orbitals

         {

           // diagonlize just to print eigenvalues

           tensorT overlap = matrix_inner(_world, k_wf, k_wf, true);

           ctensorT c; rtensorT e;

           sygv(fock, overlap, 1, c, e);

           for (unsigned int ei = 0; ei < e.dim(0); ei++)

           {

             double diffe = (ei == 0) ? 0.0 : real(e(ei,ei))-real(e(ei-1,ei-1));

             if (_world.rank() == 0)

               print("kpoint ", kp, "ei ", ei, "eps ", real(e(ei,ei)), "\tdiff\t", diffe);

           }


           for (unsigned int ei = kpoint.begin, fi = 0;

             ei < kpoint.end; ei++, fi++)

           {

             alpha[ei] = std::min(-0.1, real(fock(fi,fi)));

             fock(fi,fi) -= std::complex<T>(alpha[ei], 0.0);

           }


           std::vector<functionT> fwf = transform(_world, k_wf, fock, trantol);

           gaxpy(_world, 1.0, k_vwf, -1.0, fwf);

           fwf.clear();

         }

         for (unsigned int wi = kpoint.begin, fi = 0; wi < kpoint.end;

           wi++, fi++)

         {

           wf[wi] = k_wf[fi];

           vwf[wi] = k_vwf[fi];

         }

       }

     }

     //*************************************************************************


     //*************************************************************************

     void do_rhs_simple(vecfuncT& wf,

                 vecfuncT& vwf,

                 std::vector<KPoint> kpoints,

                 std::vector<T>& alpha,

                 std::vector<double>& eigs)

     {

       // tolerance

       double trantol = 0.1*_params.thresh/std::min(30.0,double(wf.size()));

       double thresh = 1e-4;


       if (_world.rank() == 0) _eigF << "Iteration: " << _it << endl;

       for (unsigned int kp = 0; kp < kpoints.size(); kp++)

       {

         // Get k-point and orbitals for this k-point

         KPoint kpoint = kpoints[kp];

         double k0 = kpoint.k[0];

         double k1 = kpoint.k[1];

         double k2 = kpoint.k[2];

         // Extract the relevant portion of the list of orbitals and the list of the

         // V times the orbitals

         vecfuncT k_wf(wf.begin() + kpoint.begin, wf.begin() + kpoint.end);

         vecfuncT k_vwf(vwf.begin() + kpoint.begin, vwf.begin() + kpoint.end);


         // Build fock matrix

         tensorT fock = build_fock_matrix(k_wf, k_vwf, kpoint);

         tensorT overlap = matrix_inner(_world, k_wf, k_wf, true);

         for (unsigned int i = 0; i < k_wf.size(); i++)

           fock(i,i) += std::complex<double>(i*_params.thresh*0.1,0.0);


         ctensorT U; rtensorT e;

         sygv(fock, overlap, 1, U, e);


         if (_params.print_matrices && _world.rank() == 0)

         {

             printf("(%10.5f, %10.5f, %10.5f)\n", k0, k1, k2);

             print("Overlap matrix:");

             print(overlap);


             print("Fock matrix:");

             print(fock);


             print("U matrix: (eigenvectors)");

             print(U);


             print("Fock matrix eigenvalues:");

             print(e);

         }


         // this is all of the B.S. for the solver

         if (_params.solver == 1)

         {

           unsigned int nmo = k_wf.size();

           // Fix phases.

           long imax;

           for (long j = 0; j < nmo; j++)

           {

               // Get index of largest value in column

               U(_,j).absmax(&imax);

               T ang = arg(U(imax,j));

               std::complex<T> phase = exp(std::complex<T>(0.0,-ang));

               // Loop through the rest of the column and divide by the phase

               for (long i = 0; i < nmo; i++)

               {

                 U(i,j) *= phase;

               }

           }


           // Within blocks with the same occupation number attempt to

           // keep orbitals in the same order (to avoid confusing the

           // non-linear solver).  Have to run the reordering multiple

           // times to handle multiple degeneracies.

           int maxpass = 5;

           for (int pass = 0; pass < maxpass; pass++)

           {

               long j;

               for (long i = 0; i < nmo; i++)

               {

                 U(_, i).absmax(&j);

                 if (i != j)

                 {

                   tensorT tmp = copy(U(_, i));

                   U(_, i) = U(_, j);

                   U(_, j) = tmp;

                   //swap(e[i], e[j]);

                   T ti = e[i];

                   T tj = e[j];

                   e[i] = tj; e[j] = ti;

                 }

               }

           }


           // Rotations between effectively degenerate states confound

           // the non-linear equation solver ... undo these rotations

           long ilo = 0; // first element of cluster

           while (ilo < nmo-1) {

               long ihi = ilo;

               while (fabs(real(e[ilo]-e[ihi+1])) < thresh*10.0*max(fabs(real(e[ilo])),1.0)) {

                   ihi++;

                   if (ihi == nmo-1) break;

               }

               long nclus = ihi - ilo + 1;

               if (nclus > 1) {

                   if (_world.rank() == 0) print("   found cluster", ilo, ihi);

                   tensorT q = copy(U(Slice(ilo,ihi),Slice(ilo,ihi)));

                   //print(q);

                   // Special code just for nclus=2

                   // double c = 0.5*(q(0,0) + q(1,1));

                   // double s = 0.5*(q(0,1) - q(1,0));

                   // double r = sqrt(c*c + s*s);

                   // c /= r;

                   // s /= r;

                   // q(0,0) = q(1,1) = c;

                   // q(0,1) = -s;

                   // q(1,0) = s;


                   // Iteratively construct unitary rotation by

                   // exponentiating the antisymmetric part of the matrix

                   // ... is quadratically convergent so just do 3

                   // iterations

                   ctensorT rot = matrix_exponential(-0.5*(q - conj_transpose(q)));

                   q = inner(q,rot);

                   ctensorT rot2 = matrix_exponential(-0.5*(q - conj_transpose(q)));

                   q = inner(q,rot2);

                   ctensorT rot3 = matrix_exponential(-0.5*(q - conj_transpose(q)));

                   q = inner(rot,inner(rot2,rot3));

                   U(_,Slice(ilo,ihi)) = inner(U(_,Slice(ilo,ihi)),q);

               }

               ilo = ihi+1;

           }

         }


         // transform orbitals and V * (orbitals)

         k_vwf = transform(_world, k_vwf, U, 1e-5 / std::min(30.0, double(k_wf.size())), false);

         k_wf = transform(_world, k_wf, U, FunctionDefaults<3>::get_thresh() / std::min(30.0, double(k_wf.size())), true);


         // Do right hand side stuff for kpoint

         bool isgamma = (is_equal(k0,0.0,1e-5) &&

                         is_equal(k1,0.0,1e-5) &&

                         is_equal(k2,0.0,1e-5));

         if (_params.periodic && !isgamma) // Non-zero k-point

         {

           // Do the gradient term and k^2/2

           vecfuncT d_wf = zero_functions<valueT,NDIM>(_world, k_wf.size());

           complex_derivative_3d Dx(_world,0);

           complex_derivative_3d Dy(_world,1);

           complex_derivative_3d Dz(_world,2);

           for (unsigned int i = 0; i < k_wf.size(); i++)

           {

             // gradient

             functionT dx_wf = Dx(k_wf[i]);

             functionT dy_wf = Dy(k_wf[i]);

             functionT dz_wf = Dz(k_wf[i]);


             // WSTHORNTON

 //            double delxx = std::abs(inner(k_wf[i],Dx(Dx(k_wf[i]))));

 //            double delyy = std::abs(inner(k_wf[i],Dy(Dy(k_wf[i]))));

 //            double delzz = std::abs(inner(k_wf[i],Dz(Dz(k_wf[i]))));


 //            if (_world.rank() == 0)

 //              printf("orb %2.2d  delxx:  %15.8e  delyy:  %15.8e  delzz:  %15.8e\n",i, delxx, delyy, delzz);


             // WSTHORNTON

 //            std::vector<long> npt(3,101);

 //            char fnamedx[50];

 //            sprintf(fnamedx, "xorb%2.2d__.dx",i);

 //            plotdx(k_wf[i], fnamedx, FunctionDefaults<3>::get_cell(), npt);

 //

 //            char fnamedx_dx[50];

 //            sprintf(fnamedx_dx, "xorb%2.2d__dx.dx",i);

 //            plotdx(dx_wf, fnamedx_dx, FunctionDefaults<3>::get_cell(), npt);

 //            char fnamedx_dy[50];

 //            sprintf(fnamedx_dy, "xorb%2.2d__dy.dx",i);

 //            plotdx(dy_wf, fnamedx_dy, FunctionDefaults<3>::get_cell(), npt);

 //            char fnamedx_dz[50];

 //            sprintf(fnamedx_dz, "xorb%2.2d__dz.dx",i);

 //            plotdx(dz_wf, fnamedx_dz, FunctionDefaults<3>::get_cell(), npt);

 //

 //            rfunctionT xfunc = rfactoryT(_world).functor(

 //              rfunctorT(new DipoleFunctor(0))).

 //                thresh(_params.thresh).truncate_on_project();

 //            rfunctionT yfunc = rfactoryT(_world).functor(

 //              rfunctorT(new DipoleFunctor(1))).

 //                thresh(_params.thresh).truncate_on_project();

 //            rfunctionT zfunc = rfactoryT(_world).functor(

 //              rfunctorT(new DipoleFunctor(2))).

 //                thresh(_params.thresh).truncate_on_project();

 //

 //            double xdip = std::abs(inner(k_wf[i],xfunc*k_wf[i]));

 //            double ydip = std::abs(inner(k_wf[i],yfunc*k_wf[i]));

 //            double zdip = std::abs(inner(k_wf[i],zfunc*k_wf[i]));

 //

 //            if (_world.rank() == 0)

 //              printf("orb: %1d     dipole moment: (%7.5e,%7.5e,%7.5e)\n",i,xdip,ydip,zdip);

 //

 //            double xdip1 = std::real(inner(k_wf[i],xfunc*k_wf[i]));

 //            double ydip1 = std::real(inner(k_wf[i],yfunc*k_wf[i]));

 //            double zdip1 = std::real(inner(k_wf[i],zfunc*k_wf[i]));

 //

 //            if (_world.rank() == 0)

 //              printf("orb: %1d     dipole moment: (%7.5e,%7.5e,%7.5e)\n",i,xdip1,ydip1,zdip1);

 //

 //            double xdip2 = std::imag(inner(k_wf[i],xfunc*k_wf[i]));

 //            double ydip2 = std::imag(inner(k_wf[i],yfunc*k_wf[i]));

 //            double zdip2 = std::imag(inner(k_wf[i],zfunc*k_wf[i]));

 //

 //            if (_world.rank() == 0)

 //              printf("orb: %1d     dipole moment: (%7.5e,%7.5e,%7.5e)\n\n\n",i,xdip2,ydip2,zdip2);

 //

 //            // WSTHORNTON

 //            char fname_x[50];

 //            char fname_y[50];

 //            char fname_z[50];

 //

 //            char fnamex_x[50];

 //            char fnamex_y[50];

 //            char fnamex_z[50];

 //

 //            char fnamey_x[50];

 //            char fnamey_y[50];

 //            char fnamey_z[50];

 //

 //            char fnamez_x[50];

 //            char fnamez_y[50];

 //            char fnamez_z[50];

 //

 //            sprintf(fname_x, "orb%2.2d__x.dat",i);

 //            sprintf(fname_y, "orb%2.2d__y.dat",i);

 //            sprintf(fname_z, "orb%2.2d__z.dat",i);

 //

 //            sprintf(fnamex_x, "orb%2.2d_dx_x.dat",i);

 //            sprintf(fnamex_y, "orb%2.2d_dx_y.dat",i);

 //            sprintf(fnamex_z, "orb%2.2d_dx_z.dat",i);

 //

 //            sprintf(fnamey_x, "orb%2.2d_dy_x.dat",i);

 //            sprintf(fnamey_y, "orb%2.2d_dy_y.dat",i);

 //            sprintf(fnamey_z, "orb%2.2d_dy_z.dat",i);

 //

 //            sprintf(fnamez_x, "orb%2.2d_dz_x.dat",i);

 //            sprintf(fnamez_y, "orb%2.2d_dz_y.dat",i);

 //            sprintf(fnamez_z, "orb%2.2d_dz_z.dat",i);

 //

 //            coord_3d pt1x = vec(-_params.L/2,0.0,0.0);

 //            coord_3d pt2x = vec( _params.L/2,0.0,0.0);

 //

 //            coord_3d pt1y = vec(0.0,-_params.L/2,0.0);

 //            coord_3d pt2y = vec(0.0, _params.L/2,0.0);

 //

 //            coord_3d pt1z = vec(0.0,0.0,-_params.L/2);

 //            coord_3d pt2z = vec(0.0,0.0, _params.L/2);

 //

 //            plot_line(fname_x,30000,pt1x,pt2x,k_wf[i]);

 //            plot_line(fname_y,30000,pt1y,pt2y,k_wf[i]);

 //            plot_line(fname_z,30000,pt1z,pt2z,k_wf[i]);

 //

 //            plot_line(fnamex_x,30000,pt1x,pt2x,dx_wf);

 //            plot_line(fnamex_y,30000,pt1y,pt2y,dx_wf);

 //            plot_line(fnamex_z,30000,pt1z,pt2z,dx_wf);

 //

 //            plot_line(fnamey_x,30000,pt1x,pt2x,dy_wf);

 //            plot_line(fnamey_y,30000,pt1y,pt2y,dy_wf);

 //            plot_line(fnamey_z,30000,pt1z,pt2z,dy_wf);

 //

 //            plot_line(fnamez_x,30000,pt1x,pt2x,dz_wf);

 //            plot_line(fnamez_y,30000,pt1y,pt2y,dz_wf);

 //            plot_line(fnamez_z,30000,pt1z,pt2z,dz_wf);


             d_wf[i] = std::complex<T>(0.0,k0)*dx_wf +

                       std::complex<T>(0.0,k1)*dy_wf +

                       std::complex<T>(0.0,k2)*dz_wf;

             // k^/2

             double ksq = k0*k0 + k1*k1 + k2*k2;

             k_vwf[i] += 0.5 * ksq * k_wf[i];

             k_vwf[i] -= d_wf[i];

           }

         }


         // WSTHORNTON (new code)

         unsigned int eimax = -1;

         double eimaxval = -1e10;

         for (unsigned int ei = kpoint.begin, fi = 0; ei < kpoint.end;

           ei++, fi++)

         {

           if ((real(e(fi,fi)) > 0.0) && (real(e(fi,fi)) > eimaxval))

           {

             eimax = fi;

             eimaxval = real(e(fi,fi));

           }

         }


         double eshift = (eimaxval > 0.0) ? eimaxval + 0.1 : 0.0;

         for (unsigned int ei = kpoint.begin, fi = 0; ei < kpoint.end;

           ei++, fi++)

         {

           // Save the latest eigenvalues

           eigs[ei] = real(e(fi,fi));

           alpha[ei] = e(fi,fi)-eshift;

           k_vwf[fi] += (alpha[ei]-eigs[ei])*k_wf[fi];

         }


 //        if (_world.rank() == 0) printf("do_rhs_simple: (3) ...\n\n");

 //        print_fock_matrix_eigs(k_wf, k_vwf, kpoint_gamma);


         if (_world.rank() == 0)

         {

           _eigF << "kpt: " << kp << endl;

           _eigF << setfill('-') << setw(20) << " " << endl;

           for (unsigned int ei = kpoint.begin; ei < kpoint.end; ei++)

           {

             char eigstr[50];

             sprintf(eigstr,"%3d%15.10f",ei,real(eigs[ei]));

             _eigF << eigstr << endl;

           }

           _eigF << "\n\n" << endl;

         }

         for (unsigned int wi = kpoint.begin, fi = 0; wi < kpoint.end;

           wi++, fi++)

         {

           wf[wi] = k_wf[fi];

           vwf[wi] = k_vwf[fi];

         }

       }

     }

     //*************************************************************************


     //*************************************************************************

     tensor_complex make_kinetic_matrix(World& world, const vector_complex_function_3d& v, const KPoint& k) {

         const double_complex I = double_complex(0.0,1.0);

         double kx = k.k[0];

         double ky = k.k[1];

         double kz = k.k[2];


         complex_derivative_3d Dx(world, 0);

         complex_derivative_3d Dy(world, 1);

         complex_derivative_3d Dz(world, 2);


         vector_complex_function_3d dvx = apply(world, Dx, v);

         vector_complex_function_3d dvy = apply(world, Dy, v);

         vector_complex_function_3d dvz = apply(world, Dz, v);


         // -1/2 (del + ik)^2 = -1/2 del^2 - i k.del + 1/2 k^2

         // -1/2 <p|del^2|q> = +1/2 <del p | del q>


         tensor_complex f1 = 0.5 * (matrix_inner(world, dvx, dvx, true) +

                                    matrix_inner(world, dvy, dvy, true) +

                                    matrix_inner(world, dvz, dvz, true));


         tensor_complex f2 =

             (-I*kx)*matrix_inner(world, v, dvx, false) +

             (-I*ky)*matrix_inner(world, v, dvy, false) +

             (-I*kz)*matrix_inner(world, v, dvz, false);


         tensor_complex f3 = (0.5 * (kx*kx + ky*ky + kz*kz)) * matrix_inner(world, v, v, true);


         return f1 + f2 + f3;

     }

     //*************************************************************************


     //*************************************************************************

     tensorT build_fock_matrix(vecfuncT& psi,

                               vecfuncT& vpsi,

                               KPoint kpoint)

     {

       // Build the potential matrix

       START_TIMER(_world);

       tensorT potential = matrix_inner(_world, psi, vpsi, true);

       _world.gop.fence();

       END_TIMER(_world,"potential energy matrix");

       if (_world.rank()==0) printf("\n");


       START_TIMER(_world);

       if (_world.rank() == 0) _outputF << "Building kinetic energy matrix ...\n\n" << endl;

         tensorT kinetic = ::kinetic_energy_matrix<T,NDIM>(_world, psi,

                                                   _params.periodic,

                                                   kpoint);

       tensorT kinetic2 = make_kinetic_matrix(_world, psi, kpoint);

       _world.gop.fence();

       END_TIMER(_world,"kinetic energy matrix");

       if (_world.rank() == 0) printf("\n");


       if (_world.rank() == 0) _outputF << "Constructing Fock matrix ...\n\n" << endl;

       tensorT fock = potential + kinetic;

       fock = 0.5 * (fock + conj_transpose(fock));

       _world.gop.fence();


       if (_world.rank() == 0)

       {

         print("KINETIC:");

         print(kinetic);

         print("KINETIC2:");

         print(kinetic2);

         print("POTENTIAL:");

         print(potential);

         print("FOCK:");

         print(fock);

       }


       return fock;

     }

     //*************************************************************************


     //*************************************************************************

     void gram_schmidt(vecfuncT& f, KPoint kpoint)

     {

       for (unsigned int fi = kpoint.begin; fi < kpoint.end; ++fi)

       {

         // Project out the lower states

         for (unsigned int fj = kpoint.begin; fj < fi; ++fj)

         {

           valueT overlap = inner(f[fj], f[fi]);

           f[fi] -= overlap*f[fj];

         }

         f[fi].scale(1.0/f[fi].norm2());

       }

     }

     //*************************************************************************


     //*************************************************************************

     tensorT Q3(const tensorT& s) {

         tensorT Q = inner(s,s);

         Q.gaxpy(0.2,s,-2.0/3.0);

         for (int i=0; i<s.dim(0); ++i) Q(i,i) += 1.0;

         return Q.scale(15.0/8.0);

     }

     //*************************************************************************


     //*************************************************************************

     ctensorT csqrt(const ctensorT& s, double tol=1e-8) {

         int n=s.dim(0), m=s.dim(1);

         MADNESS_ASSERT(n==m);

         ctensorT c; rtensorT e;

         //s.gaxpy(0.5,conj_transpose(s),0.5); // Ensure exact symmetry

         syev(s, c, e);

         for (int i=0; i<n; ++i) {

             if (e(i) < -tol) {

                 MADNESS_EXCEPTION("Matrix square root: negative eigenvalue",i);

             }

             else if (e(i) < tol) { // Ugh ..

                 print("Matrix square root: Warning: small eigenvalue ", i, e(i));

                 e(i) = tol;

             }

             e(i) = 1.0/sqrt(e(i));

         }

         for (int j=0; j<n; ++j) {

             for (int i=0; i<n; ++i) {

                 c(j,i) *= e(i);

             }

         }

         return c;

     }

     //*************************************************************************


     //*************************************************************************

     void orthonormalize(vecfuncT& wf, KPoint kpoint)

     {

       // extract k-point orbitals

       vecfuncT k_wf(wf.begin() + kpoint.begin, wf.begin() + kpoint.end);

       ctensorT S = matrix_inner(_world,k_wf,k_wf,true);

       printf("orthonormalize: \n");

       printf("before matrix (after): \n");

       print(S);

       ctensorT U = csqrt(S);

       k_wf = transform(_world, k_wf, U, _params.thresh, true);


       ctensorT S2 = matrix_inner(_world,k_wf,k_wf,true);

       printf("overlap matrix (after): \n");

       print(S2);

       for (unsigned int wi = kpoint.begin, fi = 0; wi < kpoint.end;

         wi++, fi++)

       {

         wf[wi] = k_wf[fi];

       }

     }

     //*************************************************************************


     //*************************************************************************

     vecfuncT compute_residual(const vecfuncT& awfs,

                               const vecfuncT& bwfs)

     {

       // vector of residual functions

       vecfuncT rm = sub(_world, _phisa, awfs);

       // if spin-polarized insert beta spin-orbital residual functions

       if (_params.spinpol)

       {

         vecfuncT br = sub(_world, _phisb, bwfs);

         rm.insert(rm.end(), br.begin(), br.end());

       }

       // scalar residual

       std::vector<double> rnvec = norm2s<valueT,NDIM>(_world, rm);

       double rnorm = 0.0;

       for (unsigned int i = 0; i < rnvec.size(); i++) rnorm += rnvec[i];

       // renormalize and print

       _residual = rnorm / rnvec.size();

       if (_world.rank() == 0) _outputF << "\nResiduals\n---------" << endl;

       if (_world.rank() == 0) _outputF << std::setiosflags(std::ios::scientific) << "residual = " << _residual << endl;

       if (_world.rank() == 0)

       {

         _outputF << endl;

         for (unsigned int i = 0; i < rnvec.size(); i++)

         {

           _outputF << "residual" << i << "\t" << rnvec[i] << endl;

         }

         _outputF << endl;

       }


       return rm;

     }


     //*************************************************************************

     void update_orbitals(vecfuncT& awfs,

                          vecfuncT& bwfs,

                          std::vector<KPoint> kpoints)

     {

       // truncate before we do anyting

       truncate<valueT,NDIM> (_world, awfs);

       truncate<valueT,NDIM> (_world, _phisa);

       if (_params.spinpol)

       {

         truncate<valueT,NDIM> (_world, bwfs);

         truncate<valueT,NDIM> (_world, _phisb);

       }

       // compute residual

       vecfuncT rm = compute_residual(awfs, bwfs);

       if (_params.solver > 0 && _params.maxsub > 1)

       {

         // nonlinear solver

         _subspace->update_subspace(awfs, bwfs, _phisa, _phisb, rm);

       }


       // do step restriction

       step_restriction(_phisa, awfs, 0);

       if (_params.spinpol)

       {

         step_restriction(_phisb, bwfs, 1);

       }

       // do gram-schmidt

       for (unsigned int kp = 0; kp < kpoints.size(); kp++)

       {

         gram_schmidt(awfs, kpoints[kp]);

 //        orthonormalize(awfs, kpoints[kp]);

         if (_params.spinpol)

         {

           gram_schmidt(bwfs, kpoints[kp]);

 //          orthonormalize(bwfs, kpoints[kp]);

         }

       }


       // update alpha and beta orbitals

       truncate<valueT,NDIM>(_world, awfs);

       for (unsigned int ai = 0; ai < awfs.size(); ai++) {

           _phisa[ai] = awfs[ai].scale(1.0 / awfs[ai].norm2());

       }

       if (_params.spinpol)

       {

         truncate<valueT,NDIM>(_world, bwfs);

         for (unsigned int bi = 0; bi < bwfs.size(); bi++)

         {

             _phisb[bi] = bwfs[bi].scale(1.0 / bwfs[bi].norm2());

         }

       }

       else

       {

         for (unsigned int ia = 0; ia < awfs.size(); ia++)

         {

           _phisb[ia] = _phisa[ia];

         }

       }

     }

     //*************************************************************************


     //*************************************************************************

     void step_restriction(vecfuncT& owfs,

                           vecfuncT& nwfs,

                           int aorb)

     {

       double s = (_it < 4) ? 0.75 : _params.sd;

       if (_world.rank() == 0) print("damping factor: ", s);

       for (unsigned int i = 0; i < owfs.size(); i++)

           nwfs[i].gaxpy(1.0 - s, owfs[i], s, false);

 //      std::vector<double> rnorm = norm2s(_world, sub(_world, owfs, nwfs));

 //      // Step restriction

 //      int nres = 0;

 //      for (unsigned int i = 0; i < owfs.size(); i++)

 //      {

 //        if (rnorm[i] > _params.maxrotn)

 //        {

 //          double s = _params.maxrotn / rnorm[i];

 //          nres++;

 //          if (_world.rank() == 0)

 //          {

 //            if (!aorb && nres == 1) _outputF << "  restricting step for alpha orbitals:" << endl;

 //            if (aorb && nres == 1) _outputF << "  restricting step for beta orbitals:" << endl;

 //            _outputF << i;

 //          }

 //          nwfs[i].gaxpy(s, owfs[i], 1.0 - s, false);

 //        }

 //      }

 //      if (nres > 0 && _world.rank() == 0) printf("\n");

 //      _world.gop.fence();

     }

     //*************************************************************************


     //*************************************************************************

     void fix_occupations(const std::vector<T>& eps,

                          std::vector<double>& occs)

     {

       // Find max/min eigenvalues

       double emax = eps[0];

       double emin = emax;

       for (int i = 0; i < eps.size(); i++)

       {

         emax = (eps[i] > emax) ? eps[i] : emax;

         emin = (eps[i] < emin) ? eps[i] : emin;

       }


       int maxits = 1000;

       // This is hardcoded to 2.0 (non-spinpolarized case) for now.

       double occmax = 2.0;

       // Fermi energy

       double efermi = 0.0;

       // Use bisection method to find the fermi energy and update occupation numbers

       bool bstop = false;

       // Some smoothing parameter

       double t1 = 1.0/_params.swidth;

       for (int it = 0; (it < maxits)&&(!bstop); it++)

       {

         // Proposed fermi energy

         efermi = 0.5 * (emax + emin);

         // Accumulated charge

         double charge = 0.0;

         // Loop over all eigenvalues and count the charge

         for (int i = 0; i < eps.size(); i++)

         {

           double x = (efermi-eps[i]) * t1;

           // need to add some smearing function here

           occs[i] = occmax*stheta_fd(x);

           charge += _kpoints[i].weight() * occs[i];

         }

         if (fabs(emax-emin) < 1e-5)

           bstop = true;

         else if (charge < _params.ncharge)

           emin = efermi;

         else

           emax = efermi;

       }

     }

     //*************************************************************************


 //    //*************************************************************************

 //    void update_eigenvalues(const vecfuncT& wavefs,

 //        const vecfuncT& pfuncs, const vecfuncT& phis,

 //        std::vector<T>& eigs)

 //    {

 //      // Update e

 //      if (_world.rank() == 0) printf("Updating e ...\n\n");

 //      for (unsigned int ei = 0; ei < eigs.size(); ei++)

 //      {

 //        functionT r = wavefs[ei] - phis[ei];

 //        double tnorm = wavefs[ei].norm2();

 //        // Compute correction to the eigenvalues

 //        T ecorrection = -0.5*real(inner(pfuncs[ei], r)) / (tnorm*tnorm);

 //        T eps_old = eigs[ei];

 //        T eps_new = eps_old + ecorrection;

 //        // Sometimes eps_new can go positive, THIS WILL CAUSE THE ALGORITHM TO CRASH. So,

 //        // I bounce the new eigenvalue back into the negative side of the real axis. I

 //        // keep doing this until it's good or I've already done it 10 times.

 //        int counter = 50;

 //        while (eps_new >= 0.0 && counter < 20)

 //        {

 //          // Split the difference between the new and old estimates of the

 //          // pi-th eigenvalue.

 //          eps_new = eps_old + 0.5 * (eps_new - eps_old);

 //          counter++;

 //        }

 //        // Still no go, forget about it. (1$ to Donnie Brasco)

 //        if (eps_new >= 0.0)

 //        {

 //          if (_world.rank() == 0) printf("FAILURE OF WST: exiting!!\n\n");

 //          _exit(0);

 //        }

 //        // Set new eigenvalue

 //        eigs[ei] = eps_new;

 //      }

 //    }

 //    //*************************************************************************


 //    //*************************************************************************

 //    double get_eig(int indx)

 //    {

 //      return _solver->get_eig(indx);

 //    }

 //    //*************************************************************************

 //

 //    //*************************************************************************

 //    functionT get_phi(int indx)

 //    {

 //      return _solver->get_phi(indx);

 //    }

 //    //*************************************************************************

 //

 //    //*************************************************************************

 //    const std::vector<double>& eigs()

 //    {

 //      return _solver->eigs();

 //    }

 //    //*************************************************************************

 //

 //    //*************************************************************************

 //    const vecfuncT& phis()

 //    {

 //      return _solver->phis();

 //    }

 //    //*************************************************************************


   };

   //***************************************************************************


 }

 #define SOLVER_H_


 #endif /* SOLVER_H_ */

madness::matrix_inner
void matrix_inner(DistributedMatrix< T > &A, const std::vector< Function< T, NDIM > > &f, const std::vector< Function< T, NDIM > > &g, bool sym=false)
Definition: chem/distpm.cc:38

thresh
const double thresh
Definition: dielectric.cc:185

madness::Solver::make_kinetic_matrix
tensor_complex make_kinetic_matrix(World &world, const vector_complex_function_3d &v, const KPoint &k)
Definition: solver.h:3538

madness::World::gop
WorldGopInterface & gop
Global operations.
Definition: worldfwd.h:462

fortran_ctypes.h
Corresponding C and Fortran types.

B
Tensor< double > B
Definition: tdse1d.cc:167

madness::tr1::shptr::shared_ptr< operatorT >

libxc.h

madness::Solver::apply_hf_exchange4
void apply_hf_exchange4(vecfuncT &phisa, vecfuncT &phisb, vecfuncT &funcsa, vecfuncT &funcsb, double &xc)
Definition: solver.h:2373

madness::reconstruct
void reconstruct(World &world, const std::vector< Function< T, NDIM > > &v, bool fence=true)
Reconstruct a vector of functions.
Definition: vmra.h:149

madness::ElectronicStructureParams::centered
bool centered
Definition: electronicstructureparams.h:113

mpfr::exp
const mpreal exp(const mpreal &v, mp_rnd_t rnd_mode)
Definition: mpreal.h:2234

madness::constants::pi
const double pi
Mathematical constant pi.
Definition: constants.h:44

R
const double R
Definition: dielectric.cc:191

madness::ElectronicStructureParams::thresh
double thresh
Definition: electronicstructureparams.h:64

double_complex
std::complex< double > double_complex
Definition: lineplot.cc:16

poperator.h

mra.h
Main include file for MADNESS and defines Function interface.

madness::Function::truncate
Function< T, NDIM > & truncate(double tol=0.0, bool fence=true)
Truncate the function with optional fence. Compresses with fence if not compressed.
Definition: mra.h:577

std::tr1::f3
const T1 const T2 const T3 & f3
Definition: gtest-tuple.h:686

madness::Solver::do_rhs_simple
void do_rhs_simple(vecfuncT &wf, vecfuncT &vwf, std::vector< KPoint > kpoints, std::vector< T > &alpha, std::vector< double > &eigs)
Definition: solver.h:3209

madness::Solver::GuessDensity::operator()
double operator()(const coordT &x) const
Definition: solver.h:1134

madness::FunctionDefaults
FunctionDefaults holds default paramaters as static class members.
Definition: funcdefaults.h:175

madness::conj_transpose
Tensor< T > conj_transpose(const Tensor< T > &t)
Returns a new deep copy of the complex conjugate transpose of the input tensor.
Definition: tensor.h:1954

madness::ElectronicStructureParams::solver
int solver
Definition: electronicstructureparams.h:92

madness::FunctionDefaults::set_bc
static void set_bc(const BoundaryConditions< NDIM > &value)
Sets the default boundary conditions.
Definition: funcdefaults.h:350

madness::gaxpy
void gaxpy(World &world, Q alpha, std::vector< Function< T, NDIM > > &a, Q beta, const std::vector< Function< R, NDIM > > &b, bool fence=true)
Generalized A*X+Y for vectors of functions -— a[i] = alpha*a[i] + beta*b[i].
Definition: vmra.h:680

madness::WSTAtomicBasisFunctor::WSTAtomicBasisFunctor
WSTAtomicBasisFunctor(const AtomicBasisFunction &aofunc, double L, double kx, double ky, double kz)
Definition: solver.h:129

madness::ElectronicStructureParams::swidth
double swidth
Definition: electronicstructureparams.h:105

madness::ElectronicStructureParams::spinpol
bool spinpol
Definition: electronicstructureparams.h:56

madness::Solver::GuessDensity::GuessDensity
GuessDensity(const MolecularEntity &mentity, const AtomicBasisSet &aobasis, const double &R, const bool &periodic)
Definition: solver.h:1158

madness::SubspaceK::SubspaceK
SubspaceK(World &world, const ElectronicStructureParams &params, const std::vector< KPoint > &kpoints)
Definition: solver.h:232

madness::ComplexExp::coordT
Vector< double, NDIM > coordT
Definition: solver.h:101

madness::Subspace
The SubspaceK class is a container class holding previous orbitals and residuals. ...
Definition: solver.h:412

madness::WSTAtomicBasisFunctor::special_points
std::vector< coord_3d > special_points() const
Override this to return list of special points to be refined more deeply.
Definition: solver.h:159

NDIM
const int NDIM
Definition: tdse1.cc:44

madness::Solver::GuessDensity
Definition: solver.h:1128

madness::archive::ParallelOutputArchive
An archive for storing local or parallel data wrapping BinaryFstreamOutputArchive.
Definition: parar.h:241

madness::ComplexExp::vec3dT
Vector< double, NDIM > vec3dT
Definition: solver.h:102

madness::KPoint
Definition: eigsolver.h:63

madness::Vector< double, NDIM >

madness::Function::compress
const Function< T, NDIM > & compress(bool fence=true) const
Compresses the function, transforming into wavelet basis. Possible non-blocking comm.
Definition: mra.h:683

madness::Derivative
Implements derivatives operators with variety of boundary conditions on simulation domain...
Definition: derivative.h:272

madness::ElectronicStructureParams
Definition: electronicstructureparams.h:45

madness::Subspace::update_subspace
void update_subspace(vecfuncT &awfs_new, vecfuncT &bwfs_new, const vecfuncT &awfs_old, const vecfuncT &bwfs_old, const vecfuncT &rm)
Definition: solver.h:452

madness::Atom::z
double z
Definition: chem/molecule.h:57

madness::ElectronicStructureParams::L
double L
Definition: electronicstructureparams.h:48

madness::plotdx
void plotdx(const Function< T, NDIM > &f, const char *filename, const Tensor< double > &cell=FunctionDefaults< NDIM >::get_cell(), const std::vector< long > &npt=std::vector< long >(NDIM, 201L), bool binary=true)
Writes an OpenDX format file with a cube/slice of points on a uniform grid.
Definition: mraimpl.h:3228

madness::truncate
void truncate(World &world, std::vector< Function< T, NDIM > > &v, double tol=0.0, bool fence=true)
Truncates a vector of functions.
Definition: vmra.h:194

testing::internal::string
::std::string string
Definition: gtest-port.h:872

madness::SeparatedConvolution
Convolutions in separated form (including Gaussian)
Definition: operator.h:117

madness::ElectronicStructureParams::rcriterion
double rcriterion
Definition: electronicstructureparams.h:111

madness::ElectronicStructureParams::canon
bool canon
Definition: electronicstructureparams.h:90

madness::ElectronicStructureParams::periodic
bool periodic
Definition: electronicstructureparams.h:58

madness::DipoleFunctor
A MADNESS functor to compute either x, y, or z.
Definition: chem/SCF.h:194

madness::ElectronicStructureParams::fractional
bool fractional
Definition: electronicstructureparams.h:84

xc
XCfunctional xc
Definition: hedft.cc:54

madness::Solver::reproject
void reproject()
Definition: solver.h:2481

madness::f
NDIM & f
Definition: mra.h:2179

madness::BC_PERIODIC
Definition: funcdefaults.h:56

madness::World::size
ProcessID size() const
Returns the number of processes in this world (same as MPI_Comm_size())
Definition: worldfwd.h:533

madness::FunctionDefaults::get_thresh
static const double & get_thresh()
Returns the default threshold.
Definition: funcdefaults.h:225

solvers.h
Defines interfaces for optimization and non-linear equation solvers.

madness::AtomicBasisSet::get_atomic_basis_function
AtomicBasisFunction get_atomic_basis_function(const Molecule &molecule, int ibf) const
Returns the ibf'th atomic basis function.
Definition: chem/molecularbasis.h:474

madness::coordT
Vector< double, 3 > coordT
Definition: chem/corepotential.cc:57

madness::Solver::matrix_exponential
ctensorT matrix_exponential(const ctensorT &A)
Definition: solver.h:2793

madness::ComplexExp::exponent
const vec3dT exponent
Definition: solver.h:104

madness::Solver::make_lda_potential
rfunctionT make_lda_potential(World &world, const rfunctionT &arho, const rfunctionT &brho, const rfunctionT &adelrhosq, const rfunctionT &bdelrhosq)
Definition: solver.h:1237

esolver.h

madness::Solver::compute_rho_slow
rfunctionT compute_rho_slow(const vecfuncT &phis, std::vector< KPoint > kpoints, std::vector< double > occs)
Compute the electronic density for either a molecular or periodic system.
Definition: solver.h:2017

MolecularNuclearChargeDensityFunctor
Definition: electronicstructureapp.h:85

madness::Function::scale
Function< T, NDIM > & scale(const Q q, bool fence=true)
Inplace, scale the function by a constant. No communication except for optional fence.
Definition: mra.h:896

madness::arg
Tensor< typename Tensor< T >::scalar_type > arg(const Tensor< T > &t)
Return a new tensor holding the argument of each element of t (complex types only) ...
Definition: tensor.h:2429

madness::FunctionDefaults::get_cell
static const Tensor< double > & get_cell()
Gets the user cell for the simulation.
Definition: funcdefaults.h:369

world.h
This header should include pretty much everything needed for the parallel runtime.

madness::inner
T inner(const vecfunc< T, NDIM > &a, const vecfunc< T, NDIM > &b)
the non-linear solver requires an inner product
Definition: nemo.h:112

madness::MolecularPotentialFunctor
Definition: potentialmanager.h:54

madness::Solver::find_kpt_from_orb
KPoint find_kpt_from_orb(unsigned int idx)
Definition: solver.h:2360

madness::Solver::Q3
tensorT Q3(const tensorT &s)
Given overlap matrix, return rotation with 3rd order error to orthonormalize the vectors.
Definition: solver.h:3631

madness::norm2s
std::vector< double > norm2s(World &world, const std::vector< Function< T, NDIM > > &v)
Computes the 2-norms of a vector of functions.
Definition: vmra.h:312

madness::ComplexExp::ComplexExp
ComplexExp(vec3dT exponent, double_complex coeff)
Definition: solver.h:106

madness::syev
void syev(const Tensor< T > &A, Tensor< T > &V, Tensor< typename Tensor< T >::scalar_type > &e)
Real-symmetric or complex-Hermitian eigenproblem.
Definition: lapack.cc:478

madness::Solver::init
void init(const std::string &filename)
Definition: solver.h:796

madness::Solver::END_TIMER
void END_TIMER(World &world, const char *msg)
Definition: solver.h:772

madness::abssq
Function< double, NDIM > abssq(const Function< double_complex, NDIM > &z, bool fence=true)
Returns a new function that is the square of the absolute value of the input.
Definition: mra.h:2255

madness::Solver::save_orbitals
void save_orbitals()
Definition: solver.h:928

madness::Solver::csqrt
ctensorT csqrt(const ctensorT &s, double tol=1e-8)
Computes matrix square root (not used any more?)
Definition: solver.h:3641

madness::Solver::Solver
Solver(World &world, const std::string &filename)
Definition: solver.h:778

madness::ElectronicStructureParams::ncharge
double ncharge
Definition: electronicstructureparams.h:103

madness::ElectronicStructureParams::plotorbs
bool plotorbs
Definition: electronicstructureparams.h:109

madness::functorT
std::shared_ptr< FunctionFunctorInterface< double, 3 > > functorT
Definition: chem/corepotential.cc:58

madness::Solver::genkmesh
std::vector< KPoint > genkmesh(unsigned int ngridk0, unsigned ngridk1, unsigned int ngridk2, double koffset0, double koffset1, double koffset2, double R)
Definition: solver.h:897

madness::ComplexExp::operator()
double_complex operator()(const coordT &x) const
You should implement this to return f(x)
Definition: solver.h:109

madness::AtomicBasisSet::nbf
int nbf(const Molecule &molecule) const
Given a molecule count the number of basis functions.
Definition: chem/molecularbasis.h:498

madness::Solver::orthonormalize
void orthonormalize(vecfuncT &wf, KPoint kpoint)
Definition: solver.h:3667

madness::Solver::Solver
Solver(World &world, const rfunctionT &vnucrhon, const vecfuncT &phis, const std::vector< T > &eigs, const ElectronicStructureParams &params, MolecularEntity mentity)
Definition: solver.h:1819

weight
FLOAT weight(const FLOAT &x)
Definition: y.cc:309

madness::WorldGopInterface::broadcast_serializable
void broadcast_serializable(objT &obj, ProcessID root)
Broadcast a serializable object.
Definition: worldgop.h:707

madness::Solver::GuessDensity::R
double R
Definition: solver.h:1131

madness::Function::norm2
double norm2() const
Returns the 2-norm of the function ... global sum ... works in either basis.
Definition: mra.h:650

std::tr1::T
const T1 &f1 return GTEST_2_TUPLE_() T(f0, f1)

max
#define max(a, b)
Definition: lda.h:53

madness::Solver::step_restriction
void step_restriction(vecfuncT &owfs, vecfuncT &nwfs, int aorb)
Definition: solver.h:3785

madness::vec
Vector< T, 1 > vec(T x)
Your friendly neighborhood factory function.
Definition: array.h:456

madness::scale
void scale(World &world, std::vector< Function< T, NDIM > > &v, const std::vector< Q > &factors, bool fence=true)
Scales inplace a vector of functions by distinct values.
Definition: vmra.h:290

madness::ElectronicStructureParams::functional
int functional
Definition: electronicstructureparams.h:52

madness::Function::reconstruct
void reconstruct(bool fence=true) const
Reconstructs the function, transforming into scaling function basis. Possible non-blocking comm...
Definition: mra.h:737

k
const int k
Definition: dielectric.cc:184

madness::Solver::initial_guess
void initial_guess()
Initializes alpha and beta mos, occupation numbers, eigenvalues.
Definition: solver.h:1323

madness::Solver::make_bsh_operators
std::vector< poperatorT > make_bsh_operators(const std::vector< T > &eigs)
Definition: solver.h:2088

madness::Solver::build_fock_matrix
tensorT build_fock_matrix(vecfuncT &psi, vecfuncT &vpsi, KPoint kpoint)
Definition: solver.h:3571

madness::FunctionDefaults::get_k
static int get_k()
Returns the default wavelet order.
Definition: funcdefaults.h:212

madness::AtomicBasisFunction
Used to represent one basis function from a shell on a specific center.
Definition: chem/molecularbasis.h:335

madness::ElectronicStructureParams::ngridk2
int ngridk2
Definition: electronicstructureparams.h:78

madness::AtomicBasisSet::read_file
void read_file(std::string filename)
read the atomic basis set from file
Definition: chem/molecularbasis.cc:107

madness::Solver
The main class of the periodic DFT solver .
Definition: solver.h:625

madness::copy
Function< T, NDIM > copy(const Function< T, NDIM > &f, const std::shared_ptr< WorldDCPmapInterface< Key< NDIM > > > &pmap, bool fence=true)
Create a new copy of the function with different distribution and optional fence. ...
Definition: mra.h:1835

madness::ElectronicStructureParams::sd
double sd
Definition: electronicstructureparams.h:115

madness::Solver::sss
double sss
Definition: solver.h:767

complexfun.h

madness::Function::trace
T trace() const
Returns global value of int(f(x),x) ... global comm required.
Definition: mra.h:1034

MolecularEntity::total_nuclear_charge
double total_nuclear_charge() const
Definition: mentity.cc:444

mpfr::min
const mpreal min(const mpreal &x, const mpreal &y)
Definition: mpreal.h:2675

madness::sub
Function< TENSOR_RESULT_TYPE(L, R), NDIM > sub(const Function< L, NDIM > &left, const Function< R, NDIM > &right, bool fence=true)
Same as operator- but with optional fence and no automatic compression.
Definition: mra.h:1778

one
const complexd one(1, 0)

madness::ElectronicStructureParams::nempty
int nempty
Definition: electronicstructureparams.h:72

madness::ElectronicStructureParams::waveorder
int waveorder
Definition: electronicstructureparams.h:66

MolecularEntity
Definition: mentity.h:95

madness::ElectronicStructureParams::maxsub
unsigned int maxsub
Definition: electronicstructureparams.h:86

psi
double psi(const Vector< double, 3 > &r)
Definition: apps/ii/hatom_energy.cc:42

madness::ElectronicStructureParams::koffset0
double koffset0
Definition: electronicstructureparams.h:94

madness::ElectronicStructureParams::nelec
int nelec
Definition: electronicstructureparams.h:50

MolecularEntity::center
void center()
Moves the center of nuclear charge to the origin.
Definition: mentity.cc:413

madness::Solver::print_potential_matrix_eigs
void print_potential_matrix_eigs(const vecfuncT &wf, const vecfuncT &vwf)
Definition: solver.h:2850

madness::DipoleFunctor::operator()
double operator()(const coordT &x) const
Definition: solver.h:171

madness::Solver::load_orbitals
void load_orbitals()
Definition: solver.h:949

madness::ElectronicStructureParams::print_matrices
bool print_matrices
Definition: electronicstructureparams.h:107

MolecularEntity::read_file
void read_file(const std::string &filename, bool fractional)
Definition: mentity.cc:289

madness::Solver::gram_schmidt
void gram_schmidt(vecfuncT &f, KPoint kpoint)
Definition: solver.h:3614

madness::ElectronicStructureParams::basis
std::string basis
Definition: electronicstructureparams.h:96

madness::Solver::GuessDensity::mentity
const MolecularEntity & mentity
Definition: solver.h:1129

madness::ComplexExp::coeff
const double_complex coeff
Definition: solver.h:103

madness::Subspace::Subspace
Subspace(World &world, const ElectronicStructureParams &params)
Definition: solver.h:445

madness::Solver::ttt
double ttt
Definition: solver.h:767

madness::ElectronicStructureParams::nio
int nio
Definition: electronicstructureparams.h:98

madness::Solver::GuessDensity::aobasis
const AtomicBasisSet & aobasis
Definition: solver.h:1130

madness::Solver::print_fock_matrix_eigs
void print_fock_matrix_eigs(const vecfuncT &wf, const vecfuncT &vwf, KPoint kpoint)
Definition: solver.h:2879

madness::WorldGopInterface::sum
void sum(T *buf, size_t nelem)
Inplace global sum while still processing AM & tasks.
Definition: worldgop.h:767

sqrt
tensorT sqrt(const tensorT &s, double tol=1e-8)
Computes matrix square root (not used any more?)
Definition: DFcode/moldft.cc:446

madness::DipoleFunctor::~DipoleFunctor
virtual ~DipoleFunctor()
Definition: solver.h:174

madness::World
A parallel world with full functionality wrapping an MPI communicator.
Definition: worldfwd.h:416

MolecularEntity::get_atom
const Atom & get_atom(unsigned int i) const
Definition: mentity.cc:369

madness::WorldGopInterface::fence
void fence()
Synchronizes all processes in communicator AND globally ensures no pending AM or tasks.
Definition: worldgop.cc:52

madness::Solver::project_ao_basis
vecfuncT project_ao_basis(World &world, KPoint kpt)
Definition: solver.h:1250

madness::Solver::make_nuclear_potential
void make_nuclear_potential()
Definition: solver.h:1101

madness::norm2
double norm2(World &world, const std::vector< Function< T, NDIM > > &v)
Computes the 2-norm of a vector of functions.
Definition: vmra.h:325

madness::Solver::compute_residual
vecfuncT compute_residual(const vecfuncT &awfs, const vecfuncT &bwfs)
Definition: solver.h:3690

potential
double potential(const coord_3d &r)
Definition: 3dharmonic.cc:133

madness::DipoleFunctor::DipoleFunctor
DipoleFunctor(int axis)
Definition: solver.h:170

madness::WSTAtomicBasisFunctor
Definition: solver.h:121

madness::ComplexExp
Definition: solver.h:99

madness::Atom::x
double x
Definition: chem/molecule.h:57

madness::ElectronicStructureParams::ngridk0
int ngridk0
Definition: electronicstructureparams.h:78

madness::Solver::set_occs2
void set_occs2(const std::vector< KPoint > &kpoints, const std::vector< double > &eigsa, const std::vector< double > &eigsb, std::vector< double > &occsa, std::vector< double > &occsb)
Definition: solver.h:1900

madness::Function
A multiresolution adaptive numerical function.
Definition: derivative.h:61

madness::Atom
Definition: chem/molecule.h:55

madness::AtomicBasisSet::eval_guess_density
double eval_guess_density(const Molecule &molecule, double x, double y, double z) const
Evaluates the guess density.
Definition: chem/molecularbasis.h:520

madness::cvecfuncT
std::vector< complex_functionT > cvecfuncT
Definition: chem/SCF.h:73

madness::ElectronicStructureParams::nbands
int nbands
Definition: electronicstructureparams.h:76

madness::ElectronicStructureParams::read_file
void read_file(const std::string &filename)
Definition: electronicstructureparams.h:170

rfunctorT
std::shared_ptr< FunctionFunctorInterface< double, 3 > > rfunctorT
Definition: esolver.h:46

madness::Solver::calculate_kinetic_energy
double calculate_kinetic_energy()
Definition: solver.h:2142

madness::Atom::y
double y
Definition: chem/molecule.h:57

madness::FunctionDefaults::set_thresh
static void set_thresh(double value)
Sets the default threshold.
Definition: funcdefaults.h:232

mpfr::sum
const mpreal sum(const mpreal tab[], unsigned long int n, mp_rnd_t rnd_mode)
Definition: mpreal.cc:241

madness::FunctionFunctorInterface
Abstract base class interface required for functors used as input to Functions.
Definition: function_interface.h:58

I
const complexd I(0, 1)

m
const double m
Definition: gfit.cc:199

rot
#define rot(x, k)
Definition: lookup3.c:72

madness::World::rank
ProcessID rank() const
Returns the process rank in this world (same as MPI_Comm_rank()))
Definition: worldfwd.h:526

madness::Solver::START_TIMER
void START_TIMER(World &world)
Definition: solver.h:768

madness::vector_complex_function_3d
std::vector< complex_function_3d > vector_complex_function_3d
Definition: functypedefs.h:86

madness::real
double real(double x)
Definition: complexfun.h:52

madness::mul_sparse
Function< TENSOR_RESULT_TYPE(L, R), NDIM > mul_sparse(const Function< L, NDIM > &left, const Function< R, NDIM > &right, double tol, bool fence=true)
Sparse multiplication — left and right must be reconstructed and if tol!=0 have tree of norms alread...
Definition: mra.h:1569

madness::plot_line
void plot_line(const char *filename, int npt, const Vector< double, NDIM > &lo, const Vector< double, NDIM > &hi, const Function< T, NDIM > &f)
Generates ASCII file tabulating f(r) at npoints along line r=lo,...,hi.
Definition: funcplot.h:388

madness::Solver::apply_potential
void apply_potential(vecfuncT &pfuncsa, vecfuncT &pfuncsb, const vecfuncT &phisa, const vecfuncT &phisb, const rfunctionT &rhoa, const rfunctionT &rhob, const rfunctionT &rho)
Applies the LDA effective potential to each orbital. Currently only lda and spin-polarized is not imp...
Definition: solver.h:2184

madness::abs
double abs(double x)
Definition: complexfun.h:48

madness::Solver::compute_rho
rfunctionT compute_rho(const vecfuncT &phis, std::vector< KPoint > kpoints, std::vector< double > occs)
Definition: solver.h:2049

madness::WSTAtomicBasisFunctor::~WSTAtomicBasisFunctor
~WSTAtomicBasisFunctor()
Definition: solver.h:139

madness::Solver::GuessDensity::periodic
const bool periodic
Definition: solver.h:1132

delta
const double delta
Definition: dielectric_external_field.cc:120

madness::Solver::Solver
Solver(World &world, rfunctionT vnucrhon, vecfuncT phis, std::vector< T > eigs, std::vector< KPoint > kpoints, std::vector< double > occs, ElectronicStructureParams params, MolecularEntity mentity)
Definition: solver.h:1854

madness::ElectronicStructureParams::ngridk1
int ngridk1
Definition: electronicstructureparams.h:78

electronicstructureparams.h

madness::FunctionDefaults::get_cell_width
static const Tensor< double > & get_cell_width()
Returns the width of each user cell dimension.
Definition: funcdefaults.h:391

madness::FunctionDefaults::set_cubic_cell
static void set_cubic_cell(double lo, double hi)
Sets the user cell to be cubic with each dimension having range [lo,hi].
Definition: funcdefaults.h:384

madness::Function::gaxpy
Function< T, NDIM > & gaxpy(const T &alpha, const Function< Q, NDIM > &other, const R &beta, bool fence=true)
Inplace, general bi-linear operation in wavelet basis. No communication except for optional fence...
Definition: mra.h:924

madness::Solver::~Solver
virtual ~Solver()
Definition: solver.h:1889

madness::ElectronicStructureParams::koffset2
double koffset2
Definition: electronicstructureparams.h:94

madness::Solver::make_nuclear_charge_density_impl
void make_nuclear_charge_density_impl()
Definition: solver.h:1049

madness::sygv
void sygv(const Tensor< T > &A, const Tensor< T > &B, int itype, Tensor< T > &V, Tensor< typename Tensor< T >::scalar_type > &e)
Generalized real-symmetric or complex-Hermitian eigenproblem.
Definition: lapack.cc:519

madness::Function::unaryop
void unaryop(T(*f)(T))
Inplace unary operation on function values.
Definition: mra.h:840

madness::Solver::make_nuclear_potential_impl
void make_nuclear_potential_impl()
Definition: solver.h:1041

op
Tensor< double > op(const Tensor< double > &x)
Definition: kain.cc:508

madness::Solver::apply_hf_exchange
void apply_hf_exchange(vecfuncT &phisa, vecfuncT &phisb, vecfuncT &funcsa, vecfuncT &funcsb)
Definition: solver.h:2413

madness::ElectronicStructureParams::restart
int restart
Definition: electronicstructureparams.h:101

std::tr1::f1
const T1 & f1
Definition: gtest-tuple.h:680

madness::ElectronicStructureParams::lo
double lo
Definition: electronicstructureparams.h:54

madness::AtomicBasisSet
Contracted Gaussian basis.
Definition: chem/molecularbasis.h:391

madness::print
void print(const A &a)
Print a single item to std::cout terminating with new line.
Definition: print.h:122

madness::project
Function< T, NDIM > project(const Function< T, NDIM > &other, int k=FunctionDefaults< NDIM >::get_k(), double thresh=FunctionDefaults< NDIM >::get_thresh(), bool fence=true)
Definition: mra.h:2162

MADNESS_EXCEPTION
#define MADNESS_EXCEPTION(msg, value)
Definition: worldexc.h:88

madness::Slice
A slice defines a sub-range or patch of a dimension.
Definition: slice.h:103

madness::Solver::update_orbitals
void update_orbitals(vecfuncT &awfs, vecfuncT &bwfs, std::vector< KPoint > kpoints)
Definition: solver.h:3723

madness::Function::thresh
double thresh() const
Returns value of truncation threshold. No communication.
Definition: mra.h:542

madness::ElectronicStructureParams::koffset1
double koffset1
Definition: electronicstructureparams.h:94

std::tr1::f2
const T1 const T2 & f2
Definition: gtest-tuple.h:680

madness::Solver::solve
void solve()
Definition: solver.h:2520

madness::FunctionFactory
FunctionFactory implements the named-parameter idiom for Function.
Definition: funcimpl.h:70

is_equal
bool is_equal(double val1, double val2, double eps)
Definition: esolver.h:190

mpfr::fabs
const mpreal fabs(const mpreal &v, mp_rnd_t rnd_mode)
Definition: mpreal.h:2187

madness::tensor_complex
Tensor< double_complex > tensor_complex
Definition: functypedefs.h:44

madness
Holds machinery to set up Functions/FuncImpls using various Factories and Interfaces.
Definition: chem/atomutil.cc:45

madness::stheta_fd
T stheta_fd(const T &x)
Definition: solver.h:76

madness::apply
Function< T, NDIM > apply(const Derivative< T, NDIM > &D, const Function< T, NDIM > &f, bool fence=true)
Applies derivative operator to function (for syntactic equivalence to integral operator apply) ...
Definition: derivative.h:613

c
const double c
Definition: gfit.cc:200

madness::KPoint::weight
double weight()
Definition: eigsolver.h:79

madness::transform
std::vector< Function< TENSOR_RESULT_TYPE(T, R), NDIM > > transform(World &world, const std::vector< Function< T, NDIM > > &v, const DistributedMatrix< R > &c, bool fence=true)
Definition: chem/SCF.cc:86

madness::wall_time
double wall_time()
Returns the wall time in seconds relative to arbitrary origin.
Definition: world.cc:248

madness::normalize
void normalize(World &world, std::vector< Function< T, NDIM > > &v, bool fence=true)
Normalizes a vector of functions — v[i] = v[i].scale(1.0/v[i].norm2())
Definition: vmra.h:765

madness::archive::ParallelInputArchive
An archive for storing local or parallel data wrapping BinaryFstreamInputArchive. ...
Definition: parar.h:266

madness::AtomicBasisFunction::get_coords
void get_coords(double &x, double &y, double &z) const
Definition: chem/molecularbasis.h:380

madness::Solver::apply_hf_exchange3
void apply_hf_exchange3(vecfuncT &phisa, vecfuncT &phisb, vecfuncT &funcsa, vecfuncT &funcsb, double &xc)
Definition: solver.h:2325

madness::Solver::print_tensor2d
void print_tensor2d(ostream &os, Tensor< Q > t)
Definition: solver.h:2834

madness::FunctionDefaults::set_k
static void set_k(int value)
Sets the default wavelet order.
Definition: funcdefaults.h:219

madness::Subspace::reproject
void reproject()
Definition: solver.h:563

MolecularEntity::natom
int natom() const
Definition: mentity.h:112

madness::WSTAtomicBasisFunctor::operator()
double_complex operator()(const coord_3d &x) const
Definition: solver.h:141

madness::SubspaceK
The SubspaceK class is a container class holding previous orbitals and residuals. ...
Definition: solver.h:193

madness::Solver::fix_occupations
void fix_occupations(const std::vector< T > &eps, std::vector< double > &occs)
Definition: solver.h:3817

madness::ElectronicStructureParams::ispotential
bool ispotential
Definition: electronicstructureparams.h:62

madness::conj
Function< T, NDIM > conj(const Function< T, NDIM > &f, bool fence=true)
Return the complex conjugate of the input function with the same distribution and optional fence...
Definition: mra.h:1879

madness::KAIN
Tensor< T > KAIN(const Tensor< T > &Q, double rcond=1e-12)
Solves non-linear equation using KAIN (returns coefficients to compute next vector) ...
Definition: solvers.h:98

madness::Solver::do_rhs
void do_rhs(vecfuncT &wf, vecfuncT &vwf, std::vector< KPoint > kpoints, std::vector< T > &alpha, std::vector< double > &eigs)
Definition: solver.h:2946

madness::SubspaceK::update_subspace
void update_subspace(vecfuncT &awfs_new, vecfuncT &bwfs_new, const vecfuncT &awfs_old, const vecfuncT &bwfs_old)
Definition: solver.h:246

madness::Solver::Solver
Solver(World &world, rfunctionT vnucrhon, vecfuncT phisa, vecfuncT phisb, std::vector< T > eigsa, std::vector< T > eigsb, ElectronicStructureParams params, MolecularEntity mentity)
Definition: solver.h:1296

madness::compress
void compress(World &world, const std::vector< Function< T, NDIM > > &v, bool fence=true)
Compress a vector of functions.
Definition: vmra.h:130

madness::Solver::test_periodicity
void test_periodicity(const Function< Q, 3 > &f)
Definition: solver.h:1166

madness::ElectronicStructureParams::maxits
int maxits
Definition: electronicstructureparams.h:60