madness/api-doc/solver_8h_source.html

/*

  This file is part of MADNESS.


  Copyright (C) 2007,2010 Oak Ridge National Laboratory


  This program is free software; you can redistribute it and/or modify

  it under the terms of the GNU General Public License as published by

  the Free Software Foundation; either version 2 of the License, or

  (at your option) any later version.


  This program is distributed in the hope that it will be useful,

  but WITHOUT ANY WARRANTY; without even the implied warranty of

  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

  GNU General Public License for more details.


  You should have received a copy of the GNU General Public License

  along with this program; if not, write to the Free Software

  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA


  For more information please contact:


  Robert J. Harrison

  Oak Ridge National Laboratory

  One Bethel Valley Road

  P.O. Box 2008, MS-6367


  email: harrisonrj@ornl.gov

  tel:   865-241-3937

  fax:   865-572-0680

*/


#include <madness/mra/mra.h>

//#include <madness/mra/lbdeux.h>

#include <madness/world/MADworld.h>

#include <madness/tensor/solvers.h>

#include <vector>

#include <madness/fortran_ctypes.h>

#include <cmath>


#include "poperator.h"

#include "libxc.h"

#include "electronicstructureparams.h"

#include "complexfun.h"

#include "esolver.h"


#ifndef SOLVER_H_


using std::endl;

using std::setfill;

using std::setw;

using std::ostream;


/*!

  \ingroup applications

  \defgroup periodic_solver Periodic Solver

  \brief The Periodic Solver group is a group that contains the software

  objects that are needed to solve a periodic Kohn-Sham hamiltonian.

*/


//*****************************************************************************

/* static double onesfunc(const coordT& x) */

/* { */

/*   return 1.0; */

/* } */

//*****************************************************************************


namespace madness

{

  //***************************************************************************

  /*!

   \ingroup periodic_solver

   \Fermi-Dirac distribution function for fixing the occupation numbers

   */

  template <typename T>


  T stheta_fd(const T& x)

  {

    if (x > 50.0)

    {

      return 1.0;

    }

    else if (x < -50.0)

    {

      return 0.0;

    }

    else

    {

      return 1.0/(1.0 + exp(-x));

    }

  }


  //***************************************************************************


  // NOTE: so this is totally hacked because of the requirement of using a box

  //       of L*L*L rather than the convention of using a combination of

  //       lattice vectors and reciprocal lattice vectors (FOR NOW)

  // On second thought, it might be ok for general use if used "right".

  //***************************************************************************

  template <std::size_t NDIM>


  class ComplexExp : public FunctionFunctorInterface<double_complex,NDIM> {

  public:

      typedef Vector<double,NDIM> coordT;

      typedef Vector<double,NDIM> vec3dT;

      const double_complex coeff;

      const vec3dT exponent;


      ComplexExp(vec3dT exponent, double_complex coeff)

              : exponent(exponent), coeff(coeff) {}


      double_complex operator()(const coordT& x) const {

          double sum = 0.0;

          for (std::size_t i=0; i<NDIM; ++i) {

              sum += x[i]*exponent[i];

          };

          return coeff*exp(double_complex(0.0,sum));

      }


  };


  //***************************************************************************


  //***************************************************************************


  class WSTAtomicBasisFunctor : public FunctionFunctorInterface<double_complex,3> {

  private:

      const AtomicBasisFunction aofunc;

      double L;

      double kx, ky, kz;


      std::vector<coord_3d> specialpt;

  public:


      WSTAtomicBasisFunctor(const AtomicBasisFunction& aofunc, double L, double kx, double ky, double kz)

          : aofunc(aofunc), L(L), kx(kx), ky(ky), kz(kz)

      {

        double x, y, z;

          aofunc.get_coords(x,y,z);

          coord_3d r;

          r[0]=x; r[1]=y; r[2]=z;

          specialpt=std::vector<coord_3d>(1,r);

      }


      ~WSTAtomicBasisFunctor() {}


      double_complex operator()(const coord_3d& x) const {

          double_complex sum = 0.0;

          const int R = 1;

          const double_complex I = double_complex(0.0,1.0);

          for (int i=-R; i<=+R; i++) {

              double xx = x[0]+i*L;

              for (int j=-R; j<=+R; j++) {

                  double yy = x[1]+j*L;

                  for (int k=-R; k<=+R; k++) {

                      double zz = x[2]+k*L;

                      sum += -exp(-I*(kx*xx+ky*yy+kz*zz+constants::pi/2))*aofunc(xx, yy, zz);

                      //print(kx,ky,kz,exp(-I*(kx*xx+ky*yy+kz*zz+constants::pi/2)),aofunc(xx, yy, zz));

                  }

              }

          }

          return sum;

      }


      std::vector<coord_3d> special_points() const {return specialpt;}

  };


  //***************************************************************************


  /// A MADNESS functor to compute either x, y, or z

  //***************************************************************************


  class DipoleFunctor : public FunctionFunctorInterface<double,3> {

  private:

      const int axis;

  public:

      DipoleFunctor(int axis) : axis(axis) {}


      double operator()(const coordT& x) const {

          return x[axis];

      }


      virtual ~DipoleFunctor() {}

  };


  //***************************************************************************


  /*!

   \ingroup periodic_solver


   \brief The SubspaceK class is a container class holding previous orbitals

   and residuals.

   \par

   The Solver class uses the Krylov Accelerated Inexact Newton Solver (KAIN)

   accelerate the convergence a given calculation. The KAIN solver needs to

   store a subspace of previous orbitals and residuals. In the case is this

   implementation, the orbitals are store according to which k-point to which

   they belong.

  */


  //***************************************************************************

  template <typename T, int NDIM>


  class SubspaceK

  {

    // Typedef's

    typedef std::complex<T> valueT;

    typedef Function<valueT,NDIM> functionT;

    typedef std::vector<functionT> vecfuncT;

    typedef std::pair<vecfuncT,vecfuncT> pairvecfuncT;

    typedef std::vector<pairvecfuncT> subspaceT;

    typedef Tensor<valueT> tensorT;

    typedef std::vector<tensorT> vectensorT;

    typedef std::vector<subspaceT> vecsubspaceT;


    //*************************************************************************

    World& _world;

    //*************************************************************************


    //*************************************************************************

    vectensorT _Q;

    //*************************************************************************


    //*************************************************************************

    vecsubspaceT _subspace;

    //*************************************************************************


    //*************************************************************************

    std::vector<KPoint> _kpoints;

    //*************************************************************************


    //*************************************************************************

    ElectronicStructureParams _params;

    //*************************************************************************


    //*************************************************************************

    double _residual;

    //*************************************************************************


  public:


    //*************************************************************************


    SubspaceK(World& world, const ElectronicStructureParams& params,

            const std::vector<KPoint>& kpoints) : _world(world), _kpoints(kpoints),

            _params(params)

    {

      _residual = 1e6;

      for (unsigned int kp = 0; kp < _kpoints.size(); kp++)

      {

        _Q.push_back(tensorT(1,1));

        _subspace.push_back(subspaceT());

      }

    }


    //*************************************************************************


    //*************************************************************************


    void update_subspace(vecfuncT& awfs_new,

                         vecfuncT& bwfs_new,

                         const vecfuncT& awfs_old,

                         const vecfuncT& bwfs_old)

    {

      // compute residuals (total)

      vecfuncT t_rm = sub(_world, awfs_old, awfs_new);

      if (_params.spinpol)

      {

        vecfuncT br = sub(_world, bwfs_old, bwfs_new);

        t_rm.insert(t_rm.end(), br.begin(), br.end());

      }

      std::vector<double> rnvec = norm2<valueT,NDIM>(_world, t_rm);

      if (_world.rank() == 0)

      {

        double rnorm = 0.0;

        for (unsigned int i = 0; i < rnvec.size(); i++) rnorm += rnvec[i];

        if (_world.rank() == 0) print("residual = ", rnorm);

        _residual = rnorm;

      }

      _world.gop.broadcast(_residual, 0);


      for (unsigned int kp = 0; kp < _kpoints.size(); kp++)

      {

        KPoint kpoint = _kpoints[kp];


        vecfuncT k_phisa(awfs_old.begin() + kpoint.begin, awfs_old.begin() + kpoint.end);

        vecfuncT k_phisb(bwfs_old.begin() + kpoint.begin, bwfs_old.begin() + kpoint.end);

        vecfuncT k_awfs(awfs_new.begin() + kpoint.begin, awfs_new.begin() + kpoint.end);

        vecfuncT k_bwfs(bwfs_new.begin() + kpoint.begin, bwfs_new.begin() + kpoint.end);


        // compute residuals for k-point

        // concatentate up and down spins

        vecfuncT k_rm = sub(_world, k_phisa, k_awfs);

        vecfuncT k_vm(k_phisa);

        if (_params.spinpol)

        {

          vecfuncT k_br = sub(_world, k_phisb, k_bwfs);

          k_rm.insert(k_rm.end(), k_br.begin(), k_br.end());

          k_vm.insert(k_vm.end(), k_phisb.begin(), k_phisb.end());

        }


        // Update subspace and matrix Q

        compress(_world, k_vm, false);

        compress(_world, k_rm, false);

        _world.gop.fence();

        subspaceT k_subspace = _subspace[kp];

        k_subspace.push_back(pairvecfuncT(k_vm,k_rm));


        int m = k_subspace.size();

        tensorT ms(m);

        tensorT sm(m);

        for (int s = 0; s < m; s++)

        {

            const vecfuncT& k_vs = k_subspace[s].first;

            const vecfuncT& k_rs = k_subspace[s].second;

            for (unsigned int i = 0; i < k_vm.size(); i++)

            {

                ms[s] += k_vm[i].inner_local(k_rs[i]);

                sm[s] += k_vs[i].inner_local(k_rm[i]);

            }

        }

        _world.gop.sum(ms.ptr(),m);

        _world.gop.sum(sm.ptr(),m);


        tensorT newQ(m,m);

        if (m > 1) newQ(Slice(0,-2),Slice(0,-2)) = _Q[kp];

        newQ(m-1,_) = ms;

        newQ(_,m-1) = sm;


        _Q[kp] = newQ;

        if (_world.rank() == 0) print(_Q[kp]);


        // Solve the subspace equations

        tensorT c;

        if (_world.rank() == 0) {

            double rcond = 1e-12;

            while (1) {

                c = KAIN(_Q[kp],rcond);

                if (abs(c[m-1]) < 3.0) {

                    break;

                }

                else if (rcond < 0.01) {

                    if (_world.rank() == 0)

                      print("Increasing subspace singular value threshold ", c[m-1], rcond);

                    rcond *= 100;

                }

                else {

                    if (_world.rank() == 0)

                      print("Forcing full step due to subspace malfunction");

                    c = 0.0;

                    c[m-1] = 1.0;

                    break;

                }

            }

        }


        _world.gop.broadcast_serializable(c, 0);

        if (_world.rank() == 0) {

            //print("Subspace matrix");

            //print(Q);

            print("Subspace solution", c);

        }


        // Form linear combination for new solution

        vecfuncT k_phisa_new = zero_functions_compressed<valueT,NDIM>(_world, k_phisa.size());

        vecfuncT k_phisb_new = zero_functions_compressed<valueT,NDIM>(_world, k_phisb.size());

        std::complex<double> one = std::complex<double>(1.0,0.0);

        unsigned int norbitals = awfs_old.size() / _kpoints.size();

        for (unsigned int m = 0; m < k_subspace.size(); m++)

        {

            const vecfuncT& k_vm = k_subspace[m].first;

            const vecfuncT& k_rm = k_subspace[m].second;

            // WSTHORNTON Stopped here!

            const vecfuncT  vma(k_vm.begin(),k_vm.begin() + norbitals);

            const vecfuncT  rma(k_rm.begin(),k_rm.begin() + norbitals);

            const vecfuncT  vmb(k_vm.end() - norbitals, k_vm.end());

            const vecfuncT  rmb(k_rm.end() - norbitals, k_rm.end());


            gaxpy(_world, one, k_phisa_new, c(m), vma, false);

            gaxpy(_world, one, k_phisa_new,-c(m), rma, false);

            gaxpy(_world, one, k_phisb_new, c(m), vmb, false);

            gaxpy(_world, one, k_phisb_new,-c(m), rmb, false);

        }

        _world.gop.fence();


        if (_params.maxsub <= 1) {

            // Clear subspace if it is not being used

            k_subspace.clear();

        }

        else if (k_subspace.size() == _params.maxsub) {

            // Truncate subspace in preparation for next iteration

            k_subspace.erase(k_subspace.begin());

            _Q[kp] = _Q[kp](Slice(1,-1),Slice(1,-1));

        }

        // Save subspace

        _subspace[kp] = k_subspace;


        for (unsigned int wi = kpoint.begin, fi = 0; wi < kpoint.end;

          wi++, fi++)

        {

          awfs_new[wi] = k_phisa_new[fi];

          bwfs_new[wi] = k_phisb_new[fi];

        }

      }

    }


    //*************************************************************************


  };


  /*!

   \ingroup periodic_solver


   \brief The SubspaceK class is a container class holding previous orbitals

   and residuals.

   \par

   The Solver class uses the Krylov Accelerated Inexact Newton Solver (KAIN)

   accelerate the convergence a given calculation. The KAIN solver needs to

   store a subspace of previous orbitals and residuals.

  */


  //***************************************************************************

  template <typename T, int NDIM>


  class Subspace

  {

    // Typedef's

    typedef std::complex<T> valueT;

    typedef Function<valueT,NDIM> functionT;

    typedef std::vector<functionT> vecfuncT;

    typedef std::pair<vecfuncT,vecfuncT> pairvecfuncT;

    typedef std::vector<pairvecfuncT> subspaceT;

    typedef Tensor<valueT> tensorT;


    //*************************************************************************

    World& _world;

    //*************************************************************************


    //*************************************************************************

    tensorT _Q;

    //*************************************************************************


    //*************************************************************************

    subspaceT _subspace;

    //*************************************************************************


    //*************************************************************************

    std::vector<KPoint> _kpoints;

    //*************************************************************************


    //*************************************************************************

    ElectronicStructureParams _params;

    //*************************************************************************


  public:


    //*************************************************************************


    Subspace(World& world, const ElectronicStructureParams& params)

      : _world(world), _params(params)

    {

    }


    //*************************************************************************


    //*************************************************************************


    void update_subspace(vecfuncT& awfs_new,

                         vecfuncT& bwfs_new,

                         const vecfuncT& awfs_old,

                         const vecfuncT& bwfs_old,

                         const vecfuncT& rm)

    {

      // concatentate up and down spins

      vecfuncT vm = awfs_old;

      if (_params.spinpol)

      {

        vm.insert(vm.end(), bwfs_old.begin(), bwfs_old.end());

      }


      // Update subspace and matrix Q

      compress(_world, vm, false);

      compress(_world, rm, false);

      _world.gop.fence();

      _subspace.push_back(pairvecfuncT(vm,rm));


      int m = _subspace.size();

      tensorT ms(m);

      tensorT sm(m);

      for (int s=0; s<m; s++)

      {

          const vecfuncT& vs = _subspace[s].first;

          const vecfuncT& rs = _subspace[s].second;

          for (unsigned int i=0; i<vm.size(); i++)

          {

              ms[s] += vm[i].inner_local(rs[i]);

              sm[s] += vs[i].inner_local(rm[i]);

          }

      }

      _world.gop.sum(ms.ptr(),m);

      _world.gop.sum(sm.ptr(),m);


      tensorT newQ(m,m);

      if (m > 1) newQ(Slice(0,-2),Slice(0,-2)) = _Q;

      newQ(m-1,_) = ms;

      newQ(_,m-1) = sm;


      _Q = newQ;

      if (_world.rank() == 0) print(_Q);


      // Solve the subspace equations

      tensorT c;

      if (_world.rank() == 0) {

          double rcond = 1e-12;

          while (1) {

              c = KAIN(_Q,rcond);

              if (abs(c[m-1]) < 3.0) {

                  break;

              }

              else if (rcond < 0.01) {

                  if (_world.rank() == 0)

                    print("Increasing subspace singular value threshold ", c[m-1], rcond);

                  rcond *= 100;

              }

              else {

                  if (_world.rank() == 0)

                    print("Forcing full step due to subspace malfunction");

                  c = 0.0;

                  c[m-1] = 1.0;

                  break;

              }

          }

      }


      _world.gop.broadcast_serializable(c, 0);

      if (_world.rank() == 0) {

          //print("Subspace matrix");

          //print(Q);

          print("Subspace solution", c);

      }


      // Form linear combination for new solution

      vecfuncT phisa_new = zero_functions_compressed<valueT,NDIM>(_world, awfs_old.size());

      vecfuncT phisb_new = zero_functions_compressed<valueT,NDIM>(_world, bwfs_old.size());

      std::complex<double> one = std::complex<double>(1.0,0.0);

      for (unsigned int m=0; m<_subspace.size(); m++) {

          const vecfuncT& vm = _subspace[m].first;

          const vecfuncT& rm = _subspace[m].second;

          const vecfuncT  vma(vm.begin(),vm.begin()+awfs_old.size());

          const vecfuncT  rma(rm.begin(),rm.begin()+awfs_old.size());

          const vecfuncT  vmb(vm.end()-bwfs_old.size(), vm.end());

          const vecfuncT  rmb(rm.end()-bwfs_old.size(), rm.end());


          gaxpy(_world, one, phisa_new, c(m), vma, false);

          gaxpy(_world, one, phisa_new,-c(m), rma, false);

          gaxpy(_world, one, phisb_new, c(m), vmb, false);

          gaxpy(_world, one, phisb_new,-c(m), rmb, false);

      }

      _world.gop.fence();


      if (_params.maxsub <= 1) {

          // Clear subspace if it is not being used

          _subspace.clear();

      }

      else if (_subspace.size() == _params.maxsub) {

          // Truncate subspace in preparation for next iteration

          _subspace.erase(_subspace.begin());

          _Q = _Q(Slice(1,-1),Slice(1,-1));

      }

      awfs_new = phisa_new;

      bwfs_new = phisb_new;

    }


    //*************************************************************************


    //*************************************************************************


    void reproject()

    {

      //  //if (_world.rank() == 0)

      //    //printf("\n\nreprojecting subspace to wavelet order: %d and thresh: %.5e\n\n",

      //    //FunctionDefaults<3>::get_k(), FunctionDefaults<3>::get_thresh());

      //

      //  unsigned int m = _subspace.size();

      //  for (unsigned int s = 0; s < m; s++)

      //  {

      //      vecfuncT& vs = _subspace[s].first;

      //      vecfuncT& rs = _subspace[s].second;

      //      reconstruct(_world, vs);

      //      reconstruct(_world, rs);

      //      unsigned int vm = vs.size();

      //      for (unsigned int i = 0; i < vm; i++)

      //      {

      //        vs[i] = madness::project(vs[i], FunctionDefaults<3>::get_k(),

      //          FunctionDefaults<3>::get_thresh(), false);

      //        rs[i] = madness::project(rs[i], FunctionDefaults<3>::get_k(),

      //          FunctionDefaults<3>::get_thresh(), false);

      //      }

      //      _world.gop.fence();

      //      truncate(_world, vs);

      //      truncate(_world, rs);

      //      normalize(_world, vs);

      //  }

      //  _world.gop.fence();


    }


    //*************************************************************************


  };


//  template <typename T, int NDIM>

//  struct lbcost {

//      double leaf_value;

//      double parent_value;

//      lbcost(double leaf_value=1.0, double parent_value=0.0) : leaf_value(leaf_value), parent_value(parent_value) {}

//      double operator()(const Key<NDIM>& key, const FunctionNode<T,NDIM>& node) const {

//          if (key.level() <= 1) {

//              return 100.0*(leaf_value+parent_value);

//          }

//          else if (node.is_leaf()) {

//              return leaf_value;

//          }

//          else {

//              return parent_value;

//          }

//      }

//  };


  //***************************************************************************


  /*! \ingroup periodic_solver

      \brief The main class of the periodic DFT solver

      \f[

      z = frac{x}{1 - y^2}

      \f]

  */


  //***************************************************************************

  template <typename T, int NDIM>


  class Solver

  {

    // Typedef's

    typedef std::complex<T> valueT;

    typedef Function<T,NDIM> rfunctionT;

    typedef FunctionFactory<T,NDIM> rfactoryT;

    typedef Function<valueT,NDIM> functionT;

    typedef std::vector<functionT> vecfuncT;

    typedef FunctionFactory<valueT,NDIM> factoryT;

    typedef Vector<double,NDIM> kvecT;

    typedef SeparatedConvolution<T,3> operatorT;

    typedef std::shared_ptr<operatorT> poperatorT;

    typedef Tensor<double> rtensorT;

    typedef Tensor<std::complex<double> > ctensorT;

    typedef Tensor<valueT> tensorT;

    typedef std::pair<vecfuncT,vecfuncT> pairvecfuncT;

    typedef std::vector<pairvecfuncT> subspaceT;

    typedef std::vector<tensorT> vectensorT;

    typedef std::vector<subspaceT> vecsubspaceT;


    //*************************************************************************

    World& _world;

    //*************************************************************************


    //*************************************************************************

    // This variable could either be a nuclear potiential or a nuclear charge

    // density depending on the "ispotential" boolean variable in the

    // ElectronicStructureParams class.

    rfunctionT _vnucrhon;

    //*************************************************************************


    //*************************************************************************

    vecfuncT _phisa;

    //*************************************************************************


    //*************************************************************************

    vecfuncT _phisb;

    //*************************************************************************


    //*************************************************************************

    std::vector<T> _eigsa;

    //*************************************************************************


    //*************************************************************************

    std::vector<T> _eigsb;

    //*************************************************************************


    //*************************************************************************

    ElectronicStructureParams _params;

    //*************************************************************************


    //*************************************************************************

    std::vector<KPoint> _kpoints;

    //*************************************************************************


    //*************************************************************************

    std::vector<double> _occsa;

    //*************************************************************************


    //*************************************************************************

    std::vector<double> _occsb;

    //*************************************************************************


    //*************************************************************************

    rfunctionT _rhoa;

    //*************************************************************************


    //*************************************************************************

    rfunctionT _rhob;

    //*************************************************************************


    //*************************************************************************

    rfunctionT _rho;

    //*************************************************************************


    //*************************************************************************

    rfunctionT _vnuc;

    //*************************************************************************


    //*************************************************************************

    SeparatedConvolution<T,NDIM>* _cop;

    //*************************************************************************


//    //*************************************************************************

//    vecsubspaceT _subspace;

//    //*************************************************************************

//

//    //*************************************************************************

//    vectensorT _Q;

//    //*************************************************************************


    //*************************************************************************

    Subspace<T,NDIM>* _subspace;

    //*************************************************************************


    //*************************************************************************

    MolecularEntity _mentity;

    //*************************************************************************


    //*************************************************************************

    double _residual;

    //*************************************************************************


    //*************************************************************************

    AtomicBasisSet _aobasis;

    //*************************************************************************


    //*************************************************************************

    double _maxthresh;

    //*************************************************************************


    //*************************************************************************

    std::ofstream _outputF;

    //*************************************************************************


    //*************************************************************************

    std::ofstream _matF;

    //*************************************************************************


    //*************************************************************************

    std::ofstream _eigF;

    //*************************************************************************


    //*************************************************************************

    std::ofstream _kmeshF;

    //*************************************************************************


    //*************************************************************************

    int _it;

    //*************************************************************************


    //*************************************************************************

    cvecfuncT _aobasisf;

    //*************************************************************************


    //*************************************************************************

    int _nao;

    //*************************************************************************


  public:


    //*************************************************************************

    double ttt, sss;


    void START_TIMER(World& world) {

        world.gop.fence(); ttt=wall_time(); sss=cpu_time();

    }


    void END_TIMER(World& world, const char* msg) {

    ttt=wall_time()-ttt; sss=cpu_time()-sss; if (world.rank()==0) printf("timer: %20.20s %8.2fs %8.2fs\n", msg, sss, ttt);

    }


    //*************************************************************************


    //*************************************************************************


    Solver(World& world, const std::string& filename) : _world(world)

    {

      init(filename);

      if (_params.periodic) FunctionDefaults<3>::set_bc(BC_PERIODIC);

      _residual = 1e5;

      make_nuclear_potential();


      if (_params.restart==0) initial_guess();

//      for (unsigned int kp = 0; kp < _kpoints.size(); kp++)

//      {

//        _Q.push_back(tensorT(1,1));

//        _subspace.push_back(subspaceT());

//      }

      _subspace = new Subspace<T,NDIM>(world, _params);

    }


    //*************************************************************************


    //*************************************************************************


    void init(const std::string& filename)

    {


      // params

      if (_world.rank() == 0)

      {

        _params.read_file(filename);

        //_params.fractional = false;

      }

      // Send params

      _world.gop.broadcast_serializable(_params, 0);

      if (_params.centered)

        FunctionDefaults<3>::set_cubic_cell(-_params.L/2,_params.L/2);

      else

        FunctionDefaults<3>::set_cubic_cell(-_params.L/2,_params.L/2);

//        FunctionDefaults<3>::set_cubic_cell(0,_params.L);

      FunctionDefaults<3>::set_thresh(_params.thresh);

      FunctionDefaults<3>::set_k(_params.waveorder);


      // mentity and aobasis

      if (_world.rank() == 0)

      {

        _aobasis.read_file(_params.basis);

        _mentity.read_file(filename, _params.fractional);

        if (_params.centered) _mentity.center();

      }

      // Send mentity and aobasis

      _world.gop.broadcast_serializable(_mentity, 0);

      _world.gop.broadcast_serializable(_aobasis, 0);

      // set number of electrons to the total nuclear charge of the mentity

      _params.nelec = _mentity.total_nuclear_charge();

      // total number of bands include empty

      _params.nbands = (_params.nelec/2) + _params.nempty;

      _params.ncharge = _mentity.total_nuclear_charge();

      if ((_params.nelec % 2) == 1) _params.nelec++;


      // Open output files

      _outputF.open("output.txt");

      _matF.open("matrix.txt");

      _eigF.open("eigs.txt");


      // kmesh

      if (_params.restart == 0)

      {

        if (_params.periodic) // PERIODIC

        {

          // GAMMA POINT

          if ((_params.ngridk0 == 1) && (_params.ngridk1 == 1) && (_params.ngridk2 == 1))

          {

            _kpoints.push_back(KPoint(coordT(0.0), 1.0));

          }

          if ((_params.ngridk0 == 0) && (_params.ngridk1 == 0) && (_params.ngridk2 == 0))

          {

            double TWO_PI = 2.0 * madness::constants::pi;

            double t1 = TWO_PI/_params.L;

            coordT c1 {0.0,0.0,0.0};

            coordT c2 {0.5*t1,0.5*t1,0.5*t1};

            _kpoints.push_back(KPoint(c1, 0.5));

            _kpoints.push_back(KPoint(c2, 0.5));

          }

          else // NORMAL BANDSTRUCTURE

          {

            _kpoints = genkmesh(_params.ngridk0, _params.ngridk1,

                                _params.ngridk2, _params.koffset0,

                                _params.koffset1, _params.koffset2,

                                _params.L);

          }

        }

        else // NOT-PERIODIC

        {

          _kpoints.push_back(KPoint(coordT(0.0), 1.0));

        }

        if (_world.rank() == 0)

        {

          _kmeshF.open("kpoints.txt");

          _kmeshF << "kpts: " << _kpoints.size() << endl;

          _kmeshF << "ik" << setw(10) << "kpt" << setw(30) << "weight" << endl;

          _kmeshF << "--" << setw(10) << "---" << setw(30) << "------" << endl;


          //_kmeshF << setfill('-') << setw(55) << "-" << endl;

          //_kmeshF << setfill(' ') << endl;

          _kmeshF << endl;

          for (unsigned int i = 0; i < _kpoints.size(); i++)

          {

            KPoint kpoint = _kpoints[i];

            _kmeshF << i << setw(10) << kpoint.k[0];

            _kmeshF << setw(10) << kpoint.k[1];

            _kmeshF << setw(10) << kpoint.k[2];

            _kmeshF << setw(10) << kpoint.weight << endl;

          }

          _kmeshF.close();

        }

      }

      else

      {

        load_orbitals();

      }

    }


    //*************************************************************************


    //*************************************************************************


    std::vector<KPoint> genkmesh(unsigned int ngridk0, unsigned ngridk1, unsigned int ngridk2,

                                 double koffset0, double koffset1, double koffset2, double R)

    {

      std::vector<KPoint> kmesh;

      double step0 = 1.0/ngridk0;

      double step1 = 1.0/ngridk1;

      double step2 = 1.0/ngridk2;

      double weight = 1.0/(ngridk0*ngridk1*ngridk2);

      double TWO_PI = 2.0 * madness::constants::pi;

      for (unsigned int i = 0; i < ngridk0; i++)

      {

        for (unsigned int j = 0; j < ngridk1; j++)

        {

          for (unsigned int k = 0; k < ngridk2; k++)

          {

            //double k0 = (i*step0 - step0/2) * TWO_PI/R;

            //double k1 = (j*step1 - step1/2) * TWO_PI/R;

            //double k2 = (k*step2 - step2/2) * TWO_PI/R;

            double k0 = ((i*step0)+koffset0) * TWO_PI/R;

            double k1 = ((j*step1)+koffset1) * TWO_PI/R;

            double k2 = ((k*step2)+koffset2) * TWO_PI/R;

            KPoint kpoint(k0, k1, k2, weight);

            kmesh.push_back(kpoint);

          }

        }

      }

      return kmesh;

    }


    //*************************************************************************


    //*************************************************************************


    void save_orbitals()

    {

      archive::ParallelOutputArchive ar(_world, "orbitals", _params.nio);

      ar & _params.spinpol;

      ar & (unsigned int)(_kpoints.size());

      for (unsigned int i = 0; i < _kpoints.size(); i++) ar & _kpoints[i];

//      ar & (unsigned int)(_occsa.size());

//      for (unsigned int i = 0; i < _occsa.size(); i++) ar & _occsa[i];

      ar & (unsigned int)(_phisa.size());

      for (unsigned int i = 0; i < _phisa.size(); i++) ar & _phisa[i];

      if (_params.spinpol)

      {

//        ar & (unsigned int)(_occsb.size());

//        for (unsigned int i = 0; i < _occsb.size(); i++) ar & _occsb[i];

        ar & (unsigned int)(_phisb.size());

        for (unsigned int i = 0; i < _phisb.size(); i++) ar & _phisb[i];

      }

    }


    //*************************************************************************


    //*************************************************************************


    void load_orbitals()

    {

      const double thresh = FunctionDefaults<3>::get_thresh();

      const int k = FunctionDefaults<3>::get_k();


      archive::ParallelInputArchive ar(_world, "orbitals");


      // spin-polarized

      bool spinrest;

      ar & spinrest;

      // kpoints

      unsigned int nkpts;

      ar & nkpts;

      _kpoints.clear();

      for (unsigned int i = 0; i < nkpts; i++)

      {

        KPoint tkpt;

        ar & tkpt;

        _kpoints.push_back(tkpt);

      }

      // occs

//      unsigned int noccs;

//      ar & noccs;

//      _occs.clear();

//      for (unsigned int i = 0; i < noccs; i++)

//      {

//        double tocc;

//        ar & tocc;

//        _occs.push_back(tocc);

//      }

      // orbitals

      unsigned int norbs;

      ar & norbs;

      _phisa.clear();

      _eigsa.clear();

      for (unsigned int i = 0; i < norbs; i++)

      {

        functionT tfunc;

        ar & tfunc;

        _phisa.push_back(tfunc);

        _eigsa.push_back(-0.1);

      }

      // check for k mismatch

      if (_phisa[0].k() != k)

      {

        reconstruct(_world,_phisa);

        for (unsigned int i = 0; i < _phisa.size(); i++)

          _phisa[i] = madness::project(_phisa[i], k, thresh, false);

        _world.gop.fence();

      }

      // orthonormalize

      for (unsigned int i = 0; i < _kpoints.size(); i++)

        gram_schmidt(_phisa, _kpoints[i]);


      if (_params.spinpol)

      {

        _phisb.clear();

        _eigsb.clear();

        for (unsigned int i = 0; i < norbs; i++)

        {

          functionT tfunc;

          ar & tfunc;

          _phisb.push_back(tfunc);

          _eigsb.push_back(-0.1);

        }

        // check for k mismatch

        if (_phisb[0].k() != k)

        {

          reconstruct(_world,_phisb);

          for (unsigned int i = 0; i < _phisb.size(); i++)

            _phisb[i] = madness::project(_phisb[i], k, thresh, false);

          _world.gop.fence();

        }

        // orthonormalize

        for (unsigned int i = 0; i < _kpoints.size(); i++)

          gram_schmidt(_phisb, _kpoints[i]);

      }

      else

      {

        for (unsigned int i = 0; i < norbs; i++)

        {

          _phisb.push_back(_phisa[i]);

          _eigsb.push_back(_eigsa[i]);

        }

      }

      // create vector for occupation numbers

      _occsa = std::vector<double>(norbs, 0.0);

      _occsb = std::vector<double>(norbs, 0.0);

    }


    //*************************************************************************


    //*************************************************************************


    void make_nuclear_potential_impl()

    {

      _vnucrhon = rfactoryT(_world).functor(rfunctorT(new MolecularPotentialFunctor(_mentity))).thresh(_params.thresh * 0.1).truncate_on_project();

      _vnuc = copy(_vnucrhon);

    }


    //*************************************************************************


    //*************************************************************************


    void make_nuclear_charge_density_impl()

    {

      std::vector<coordT> specialpts;

      for (int i = 0; i < _mentity.natom(); i++)

      {

        coordT pt(0.0);

        Atom atom = _mentity.get_atom(i);

        pt[0] = atom.x; pt[1] = atom.y; pt[2] = atom.z;

        specialpts.push_back(pt);

        if (_world.rank() == 0) print("Special point: ", pt);

      }

      double now = wall_time();

      std::cout << "THE FUNCTOR IS " << MolecularNuclearChargeDensityFunctor(_mentity, _params.L, _params.periodic, specialpts)(specialpts[0]) << endl;

      // WSTHORNTON

      //MADNESS_ASSERT(false);


      _vnucrhon = rfactoryT(_world).functor(

          rfunctorT(new MolecularNuclearChargeDensityFunctor(_mentity, _params.L, _params.periodic, specialpts))).

          thresh(_params.thresh).initial_level(6).truncate_on_project();


      if (_world.rank() == 0) printf("%f\n", wall_time() - now);

      if (_world.rank() == 0) print("calculating trace of rhon ..\n\n");

      double rtrace = _vnucrhon.trace();

      if (_world.rank() == 0) print("rhon trace = ", rtrace);

      now = wall_time();

      _vnucrhon.truncate();

      _vnuc = apply(*_cop, _vnucrhon);

      if (_world.rank() == 0) printf("%f\n", wall_time() - now);

      if (_world.rank() == 0) print("Done creating nuclear potential ..\n");


      // WSTHORNTON

      rfunctionT vnuc2 = rfactoryT(_world).functor(rfunctorT(new

          MolecularPotentialFunctor(_mentity))).

          thresh(_params.thresh * 0.1).truncate_on_project();

      rfunctionT vnucdiff = _vnuc-vnuc2;

      double t1 = vnucdiff.trace();

      if (_world.rank() == 0) printf("Difference in nuclear potential: %15.8f\n\n", t1);

      for (int i = 0; i < 101; i++)

      {

        double dx = _params.L/100;

        double pt2 = -_params.L/2 + dx*i;

        coordT cpt(pt2);

        double val = vnucdiff(cpt);

        if (_world.rank() == 0) printf("%10.5f    %15.8f\n",pt2,val);

      }

      //MADNESS_ASSERT(false);

    }


    //*************************************************************************


    //*************************************************************************


    void make_nuclear_potential()

    {

      // Make coulomb operator

      _cop = CoulombOperatorPtr(_world, _params.lo, FunctionDefaults<3>::get_thresh() * 0.1);


      Tensor<double> csize = FunctionDefaults<3>::get_cell();

      if (_world.rank() == 0)

      {

        printf("Cell parameters\n");

        printf("------------------------------\n");

        print("cell(x) is ",csize(0,0), csize(0,1));

        print("cell(y) is ",csize(1,0), csize(1,1));

        print("cell(z) is ",csize(2,0), csize(2,1));

        printf("\n");

      }

      if (_params.ispotential) // potential

      {

        make_nuclear_potential_impl();

      }

      else // charge density

      {

        make_nuclear_charge_density_impl();

      }

    }


    //*************************************************************************


    //*************************************************************************


    struct GuessDensity : public FunctionFunctorInterface<double,3> {

        const MolecularEntity& mentity;

        const AtomicBasisSet& aobasis;

        double R;

        const bool periodic;


        double operator()(const coordT& x) const

        {

          double value = 0.0;

          if (periodic)

          {

            for (int xr = -2; xr <= 2; xr += 1)

            {

              for (int yr = -2; yr <= 2; yr += 1)

              {

                for (int zr = -2; zr <= 2; zr += 1)

                {

                  value += aobasis.eval_guess_density(mentity,

                      x[0]+xr*R, x[1]+yr*R, x[2]+zr*R);

                }

              }

            }

          }

          else

          {

            value = aobasis.eval_guess_density(mentity, x[0], x[1], x[2]);

          }

          return value;

        }


        GuessDensity(const MolecularEntity& mentity, const AtomicBasisSet& aobasis,

            const double& R, const bool& periodic)

        : mentity(mentity), aobasis(aobasis), R(R), periodic(periodic) {}


    };


    //*************************************************************************


    //*************************************************************************

    template <typename Q>


    void test_periodicity(const Function<Q,3>& f)

    {

      int npts = 101;

      double eps = 1e-8;

      coordT r(0.0);

      double delta = _params.L/(npts-1);

      double begin = -_params.L/2;

      double end = _params.L/2;

      double tol = 1e-6;

      // x-axis

      printf("periodicity along x-axis:  \n");

      printf("-------------------------------------------------------------\n\n");

      for (int i = 0; i < npts; i++)

      {

        printf("\n-------------------- edge --------------------\n");

        for (int j = 0; j < npts; j++)

        {

          coordT r1, r2, dr1, dr2;

          r1[0] = begin+eps; r1[1] = (i*delta)+begin; r1[2] = (j*delta)+begin;

          r2[0] = end-eps; r2[1] = (i*delta)+begin; r2[2] = (j*delta)+begin;

          dr1[0] = begin+2*eps; dr1[1] = (i*delta)+begin; dr1[2] = (j*delta)+begin;

          dr2[0] = end-2*eps; dr2[1] = (i*delta)+begin; dr2[2] = (j*delta)+begin;

          double val = std::abs(f(r1)-f(r2));

          std::string success = val < tol ? "PASS!" : "FAIL!";

          printf("%10.6f%10.6f%10.6f  %10.6f%10.6f%10.6f  %10.5e   %s\n",

              r1[0],r1[1],r1[2],r2[0],r2[1],r2[2],val,success.c_str());

        }

      }

      // y-axis

      printf("\nperiodicity along y-axis:  \n");

      printf("-------------------------------------------------------------\n\n");

      for (int i = 0; i < npts; i++)

      {

        printf("\n-------------------- edge --------------------\n");

        for (int j = 0; j < npts; j++)

        {

          coordT r1, r2, dr1, dr2;

          r1[0] = (i*delta)+begin; r1[1] = begin+eps; r1[2] = (j*delta)+begin;

          r2[0] = (i*delta)+begin; r2[1] = end-eps; r2[2] = (j*delta)+begin;

          dr1[0] = (i*delta)+begin; dr1[1] = begin+2*eps; dr1[2] = (j*delta)+begin;

          dr2[0] = (i*delta)+begin; dr2[1] = end-2*eps; dr2[2] = (j*delta)+begin;

          double val = std::abs(f(r1)-f(r2));

          std::string success = val < tol ? "PASS!" : "FAIL!";

          printf("%10.6f%10.6f%10.6f  %10.6f%10.6f%10.6f  %10.5e   %s\n",

              r1[0],r1[1],r1[2],r2[0],r2[1],r2[2],val,success.c_str());

        }

      }

      // z-axis

      printf("\nperiodicity along z-axis:  \n");

      printf("-------------------------------------------------------------\n\n");

      for (int i = 0; i < npts; i++)

      {

        printf("\n-------------------- edge --------------------\n");

        for (int j = 0; j < npts; j++)

        {

          coordT r1, r2, dr1, dr2;

          r1[0] = (i*delta)+begin; r1[1] = (j*delta)+begin; r1[2] = begin+eps;

          r2[0] = (i*delta)+begin; r2[1] = (j*delta)+begin; r2[2] = end-eps;

          dr1[0] = (i*delta)+begin; dr1[1] = (j*delta)+begin; dr1[2] = begin+2*eps;

          dr2[0] = (i*delta)+begin; dr2[1] = (j*delta)+begin; dr2[2] = end-2*eps;

          double val = std::abs(f(r1)-f(r2));

          std::string success = val < tol ? "PASS!" : "FAIL!";

          printf("%10.6f%10.6f%10.6f  %10.6f%10.6f%10.6f  %10.5e   %s\n",

              r1[0],r1[1],r1[2],r2[0],r2[1],r2[2],val,success.c_str());

        }

      }

    }


    //*************************************************************************


    //*************************************************************************

    rfunctionT


    make_lda_potential(World& world,

                       const rfunctionT& arho,

                       const rfunctionT& brho,

                       const rfunctionT& adelrhosq,

                       const rfunctionT& bdelrhosq)

    {

  //      MADNESS_ASSERT(!_params.spinpol);

        rfunctionT vlda = copy(arho);

//        vlda.unaryop(&::libxc_ldaop<double>);

        vlda.unaryop(&::ldaop<double>);

        return vlda;

    }


    vecfuncT project_ao_basis(World& world, KPoint kpt) {

        vecfuncT ao(_aobasis.nbf(_mentity));


//        Level initial_level = 3;

//        for (int i=0; i < _aobasis.nbf(_mentity); i++) {

//          functorT aofunc(new AtomicBasisFunctor(_aobasis.get_atomic_basis_function(_mentity,i),

//              _params.L, _params.periodic, kpt));

//            ao[i] = factoryT(world).functor(aofunc).initial_level(initial_level).truncate_on_project().nofence();

//        }

//        world.gop.fence();


//        WSTAtomicBasisFunctor aofunc(_aobasis.get_atomic_basis_function(_mentity,4),

//            _params.L, kpt.k[0], kpt.k[1], kpt.k[2]);

//        coord_3d p(5e-2);

//        double_complex val = aofunc(p);

//        print("AO_PROJECT: val is ", val);

//        MADNESS_ASSERT(false);


        for (int i=0; i < _aobasis.nbf(_mentity); i++) {

          functorT aofunc(new WSTAtomicBasisFunctor(_aobasis.get_atomic_basis_function(_mentity,i),

              _params.L, kpt.k[0], kpt.k[1], kpt.k[2]));

            ao[i] = factoryT(world).functor(aofunc).truncate_on_project().truncate_mode(0);

        }

        world.gop.fence();


//        std::vector<double> norms;

//        norms = norm2s(world, ao);

//        for (int i=0; i<_aobasis.nbf(_mentity); i++) {

//            if (world.rank() == 0 && fabs(norms[i]-1.0)>1e-3) print(i," bad ao norm?", norms[i]);

//            norms[i] = 1.0/norms[i];

//        }

//

//        scale(world, ao, norms);

//        norms = norm2s(world, ao);

//        for (int i=0; i<_aobasis.nbf(_mentity); i++) {

//            if (world.rank() == 0 && fabs(norms[i]-1.0)>1e-3) print(i," bad ao norm?", norms[i]);

//            norms[i] = 1.0/norms[i];

//        }

//        scale(world, ao, norms);


        return ao;

    }


    //*************************************************************************


    //*************************************************************************

    // Constructor


    Solver(World& world,

           rfunctionT vnucrhon,

           vecfuncT phisa,

           vecfuncT phisb,

           std::vector<T> eigsa,

           std::vector<T> eigsb,

           ElectronicStructureParams params,

           MolecularEntity mentity)

       : _world(world), _vnucrhon(vnucrhon), _phisa(phisa), _phisb(phisb),

       _eigsa(eigsa), _eigsb(eigsb), _params(params), _mentity(mentity)

    {

      _residual = 1e5;

      _cop = CoulombOperatorPtr(const_cast<World&>(world), params.lo, params.thresh * 0.1);


      if (params.ispotential)

      {

        _vnuc = copy(_vnucrhon);

      }

      else

      {

        _vnuc = apply(*_cop, _vnucrhon);

      }

    }


    //*************************************************************************


    /// Initializes alpha and beta mos, occupation numbers, eigenvalues

    //*************************************************************************


    void initial_guess()

    {

      // Get initial guess for the electronic density

      if (_world.rank() == 0) print("Guessing rho ...\n\n");


      rfunctionT rho = rfactoryT(_world);

      if (_params.restart == 0)

      {

        rho = rfactoryT(_world).functor(rfunctorT(new GuessDensity(_mentity,

              _aobasis, _params.L, _params.periodic))).initial_level(3);

      }

      else

      {

        MADNESS_EXCEPTION("restart not working right now!",0);

      }

      // This is a cheat

      rho.scale(_params.ncharge/rho.trace());


      char fname3[25];

      coord_3d rp1(-_params.L/2);

      coord_3d rp2(_params.L/2);

      plot_line(fname3,101,rp1,rp2,rho);


      // load balance

      //if(_world.size() > 1) {

      //    START_TIMER(_world);

      //    LoadBalanceDeux<3> lb(_world);

      //    lb.add_tree(_vnuc, lbcost<double,3>(1.0, 0.0), false);

      //    lb.add_tree(rho, lbcost<double,3>(1.0, 1.0), true);


      //    FunctionDefaults<3>::redistribute(_world, lb.load_balance(6.0));

      //}


      if (_params.restart != 1)

      {

        // build effective potential

        rfunctionT vlocal;

        // Is this a many-body system?

        if (_params.ncharge > 1.0)

        {

          if (_world.rank() == 0) print("Creating Coulomb op ...\n\n");

          SeparatedConvolution<double, 3>* op = 0;

          // Is this system periodic?

          if (_params.periodic)

          {

            Tensor<double> cellsize = FunctionDefaults<3>::get_cell_width();

            //op = PeriodicCoulombOpPtr<double, 3> (_world, _params.waveorder,

            //    _params.lo, _params.thresh * 0.1, cellsize);

            op = CoulombOperatorPtr(_world, _params.lo, _params.thresh * 0.1);

          }

          else

          {

            op = CoulombOperatorPtr(_world, _params.lo, _params.thresh * 0.1);

          }

          if (_world.rank() == 0) print("Building effective potential ...\n\n");

          rfunctionT vc = apply(*op, rho);

          vlocal = _vnuc + vc; //.scale(1.0-1.0/nel); // Reduce coulomb to increase binding

          rho.scale(0.5);

          // WSTHORNTON

          _rhoa = rho;

          _rhob = rho;

          // Do the LDA

          rfunctionT vlda = make_lda_potential(_world, rho, rho, rfunctionT(), rfunctionT());

          vlocal = vlocal + vlda;

          delete op;

        }

        else

        {

          vlocal = _vnuc;

        }


        // Clear these functions

//        rho.clear();

        vlocal.reconstruct();


        // Get size information from k-points and ao_basis so that we can correctly size

        // the _orbitals data structure and the eigs tensor

        // number of orbitals in the basis set

        int _nao = _aobasis.nbf(_mentity);


        // number of kpoints

        int nkpts = _kpoints.size();

        // total number of orbitals to be processed (no symmetry)

        int norbs = _params.nbands * nkpts;

        // Check to see if the basis set can accomodate the number of bands

        if (_params.nbands > _nao)

          MADNESS_EXCEPTION("Error: basis not large enough to accomodate number of bands", _nao);

        // set the number of orbitals

        _eigsa = std::vector<double>(norbs, 0.0);

        _eigsb = std::vector<double>(norbs, 0.0);

        _occsa = std::vector<double>(norbs, 0.0);

        _occsb = std::vector<double>(norbs, 0.0);

        if (_world.rank() == 0) print("Building kinetic energy matrix ...\n\n");

        // Need to do kinetic piece for every k-point

        for (int ki = 0; ki < nkpts; ki++)

        {

          // These are our initial basis functions

          if (_world.rank() == 0) print("Projecting atomic orbitals ...\n\n");

          START_TIMER(_world);

          cvecfuncT ao = project_ao_basis(_world, _kpoints[ki]);

          END_TIMER(_world, "projecting atomic orbital basis");

//          for (unsigned int iao = 0; iao < _nao; iao)

//          {

//            _aobasisf.push_back(ao[iao]);

//          }


          for (unsigned int ai = 0; ai < ao.size(); ai++)

          {

            std::vector<long> npt(3,101);

            char fnamedx[50];

            sprintf(fnamedx, "aofunc_k_%2.2d__%2.2d__.dx",ki,ai);

            std::vector<long> npt2(3,101);

            plotdx(ao[ai], fnamedx, FunctionDefaults<3>::get_cell(), npt2);

          }


          coord_3d p1(-_params.L/2);

          coord_3d p2(_params.L/2);

          for (int i = 0; i < ao.size(); i++)

          {

            char fname[25];

            sprintf(fname, "ao_line_%d.txt",i);

            plot_line(fname,101,p1,p2,ao[i]);

          }

          char fname2[25];

          sprintf(fname2, "vnuc_line.txt");

          plot_line(fname2,101,p1,p2,_vnuc);

          char fname3[25];

          sprintf(fname3, "vlocal_line.txt");

          plot_line(fname3,101,p1,p2,vlocal);


          // load balancing

          //if(_world.size() > 1)

          //{

          //  LoadBalanceDeux<3> lb(_world);

          //  lb.add_tree(_vnuc, lbcost<double,3>(1.0, 1.0), false);

          //  for(unsigned int i = 0; i < ao.size(); i++)

          //  {

          //      lb.add_tree(ao[i], lbcost<valueT,3>(1.0, 1.0), false);

          //  }


          //  FunctionDefaults<3>::redistribute(_world, lb.load_balance(6.0));

          //}


          // Get k-point from list

          KPoint& kpoint = _kpoints[ki];


          // WSTHORNTON

//          ctensorT S = matrix_inner(_world,ao,ao,true);

//          print(S);

//          ctensorT U = csqrt(S);

//          ao = transform(_world, ao, U, _params.thresh, true);


          // Build kinetic matrx

          //ctensorT kinetic = ::kinetic_energy_matrix_slow<T,NDIM>(_world, ao, _params.periodic, kpt);

          ctensorT kinetic = ::kinetic_energy_matrix_slow<T,NDIM>(_world, ao, _params.periodic, kpoint);

          // Build the overlap matrix

          if (_world.rank() == 0) print("Building overlap matrix ...\n\n");

          ctensorT overlap = matrix_inner(_world, ao, ao, true);

          // Build the potential matrix

          reconstruct(_world, ao);

          if (_world.rank() == 0) print("Building potential energy matrix ...\n\n");

          //cvecfuncT vpsi = mul_sparse(_world, vlocal, ao, _params.thresh);

          cvecfuncT vpsi;

          for (int i = 0; i < ao.size(); i++)

            vpsi.push_back(vlocal*ao[i]);

          _world.gop.fence();

          compress(_world, vpsi);

          truncate(_world, vpsi);

          compress(_world, ao);

          // Build the potential matrix

          ctensorT potential = matrix_inner(_world, vpsi, ao, true);

          _world.gop.fence();

          // free memory

          vpsi.clear();

          _world.gop.fence();


          // Construct and diagonlize Fock matrix

          ctensorT fock = potential + kinetic;

          ctensorT fockzero = fock-conj_transpose(fock);

          if (_world.rank() == 0)

          {

            print("Kinetic:");

            print(kinetic);

            print("Potential:");

            print(potential);

            print("Fock: (pre-symmetrized)");

            print(fock);

            print("FockZero: (should be zero)");

            print(fockzero);

            print("Overlap:");

            print(overlap);

          }

          fock = 0.5 * (fock + conj_transpose(fock));

          for (unsigned int i = 0; i < fock.dim(0); i++)

          {

            fock(i,i) += i*_params.thresh*0.1;

          }


          ctensorT c; rtensorT e;

          sygv(fock, overlap, 1, c, e);


          // diagonlize kinetic

          ctensorT ck; rtensorT ek;

          sygv(kinetic, overlap, 1, ck, ek);

          // diagonalize potential

          ctensorT cp; rtensorT ep;

          sygv(potential, overlap, 1, cp, ep);

          // diagonalize overlap

          ctensorT co; rtensorT eo;

          syev(overlap, co, eo);


          if (_world.rank() == 0)

          {

            print("fock eigenvectors dims:",c.dim(0),c.dim(1));

            print("fock eigenvectors:");

            print(c);

          }


          if (_world.rank() == 0)

          {

            print("kinetic eigenvalues");

            print(ek);

          }


          if (_world.rank() == 0)

          {

            print("potential eigenvalues");

            print(ep);

          }


          if (_world.rank() == 0)

          {

            print("overlap eigenvalues");

            print(eo);

          }

          if (_world.rank() == 0)

          {

            print("fock eigenvalues");

            print(e);

          }


          if (_world.rank() == 0)

          {

            printf("Overlap: \n");

            for (int i = 0; i < overlap.dim(0); i++)

                {

                    for (int j = 0; j < overlap.dim(1); j++)

                        {

                            printf("%10.5f", real(overlap(i,j)));

                        }

                    printf("\n");

                }

            printf("\n");

            printf("\n");

          }


          compress(_world, ao);

          _world.gop.fence();

          // Take linear combinations of the gaussian basis orbitals as the starting

          // orbitals for solver

          vecfuncT tmp_orbitals = transform(_world, ao, c(_, Slice(0, _nao - 1)));


//          tmp_orbitals[0] = ao[0];

//          tmp_orbitals[1] = ao[1];

//          tmp_orbitals[2] = ao[2];

//          tmp_orbitals[3] = ao[3];

//          tmp_orbitals[4] = ao[4];


          // WSTHORNTON

          // checking the symmetry

//          int npts = 101;

//          double delta = _params.L/(npts-1);

//          double begin = -_params.L/2;

//          double end = _params.L/2;

//          double tol = 1e-6;

//

//          for (int i = 0; i < npts; i++)

//          {

//            double x = (i*delta)+begin;

//            for (int j = 0; j < npts; j++)

//            {

//              double y = (j*delta)+begin;

//              for (int k = 0; k < npts; k++)

//              {

//                double z = (k*delta)+begin;

//                coord_3d r1 {x,y,z};

//                coord_3d r2 {y,x,z};

//                coord_3d r3 {z,y,x};

//                coord_3d r4 {x,z,y};

//                double_complex pxr2 = ao[2](r2); double_complex pyr1 = ao[3](r1);

//                double_complex pxr3 = ao[2](r3); double_complex pzr1 = ao[4](r1);

//                double_complex pyr4 = ao[3](r4);

//                double err_xy = std::abs(pxr2-pyr1);

//                double err_xz = std::abs(pxr3-pzr1);

//                std::string success = err_xy < tol ? "PASS!" : "FAIL!";

//                printf("%10.4e + %10.4e     %10.4e + %10.4e     %15.8e\n     %s\n",

//                    std::real(pxr2), std::imag(pxr2), std::real(pyr1), std::imag(pyr1),

//                    err_xy, success.c_str());

//              }

//            }

//          }


//          MADNESS_ASSERT(false);


          // WSTHORNTON

//          const double PI_OVER_8 = madness::constants::pi/8;

//          SeparatedConvolution<double,3> op = CoulombOperator(_world, _params.lo, _params.thresh * 0.1);

//          rfunctionT vlda = make_lda_potential(_world, rho, rho, rfunctionT(), rfunctionT());

//          rho.scale(2.0);

//          rfunctionT vc2 = apply(op,rho);

//          double rtr2 = rho.trace();

//          rfunctionT vlocal2 = vc2 + _vnuc;

//

//          SeparatedConvolution<double,3> op2 = CoulombOperator(_world, _params.lo, _params.thresh * 0.1);

//          SeparatedConvolution<double,3> bshop = BSHOperator3D(_world, -0.2, _params.lo, _params.thresh * 0.1);


//          if (_world.rank() == 0)

//          {

//            print("trace of rho:");

//            print(rtr2);

//          }

//          for (int i = 0; i < 5; i++)

//          {

//            double th = i*PI_OVER_8;

//            tmp_orbitals[2] = ao[2];

//            tmp_orbitals[3] = cos(th)*ao[3] + sin(th)*ao[4];

//            tmp_orbitals[4] = -sin(th)*ao[3] + cos(th)*ao[4];

//

//            ctensorT fred(3,3);

//            for (int ii = 2; ii < 5; ii++)

//            {

//              for (int jj = 2; jj < 5; jj++)

//              {

//                fred(ii-2,jj-2) = inner(tmp_orbitals[ii], _vnuc*tmp_orbitals[jj]);

//                if (std::abs(fred(ii-2,jj-2)) < 1e-6)

//                  fred(ii-2,jj-2) = std::complex<double>(0.0,0.0);

//

//              }

//            }


//            complex_derivative_3d Dx(_world,0);

//            complex_derivative_3d Dy(_world,1);

//            complex_derivative_3d Dz(_world,2);

//

//            ctensorT fred(3,3);

//            std::complex<double> I = std::complex<double>(0.0,1.0);

//            std::complex<double> one = std::complex<double>(1.0,0.0);

//            for (int ii = 2; ii < 5; ii++)

//            {

//              for (int jj = 2; jj < 5; jj++)

//              {

//                double ksq = kpoint.k[0]*kpoint.k[0] +

//                    kpoint.k[1]*kpoint.k[1] +

//                    kpoint.k[2]*kpoint.k[2];

//

//                cfunctionT ct1 = -I*kpoint.k[0]*Dx(tmp_orbitals[jj]) -

//                  I*kpoint.k[1]*Dy(tmp_orbitals[jj]) -

//                  I*kpoint.k[2]*Dz(tmp_orbitals[jj]);

//

//                cfunctionT ct2 = -0.5*Dx(Dx(tmp_orbitals[jj])) +

//                    Dy(Dy(tmp_orbitals[jj])) +

//                    Dz(Dz(tmp_orbitals[jj]));

//

//                cfunctionT ct3 = 0.5*ksq*tmp_orbitals[jj];

//

//                fred(ii-2,jj-2) = inner(tmp_orbitals[ii], ct1+ct2+ct3);

//                if (std::abs(fred(ii-2,jj-2)) < 1e-6)

//                  fred(ii-2,jj-2) = std::complex<double>(0.0,0.0);

//              }

//            }


//            ctensorT cf; rtensorT ef;

//            syev(fred, cf, ef);

//

//            if (_world.rank() == 0)

//            {

//                print("Fred:", i);

//                print(fred);

//                print("eigenvalues:");

//                print(ef);

//                print("eigenvectors:");

//                print(cf);

//            }

//          }

//          MADNESS_ASSERT(false);


          _world.gop.fence();

          truncate(_world, tmp_orbitals);

          normalize(_world, tmp_orbitals);


          // Build the overlap matrix

          if (_world.rank() == 0) print("Building overlap matrix ...\n\n");

          ctensorT overlap2 = matrix_inner(_world, tmp_orbitals, tmp_orbitals, true);


          rtensorT tmp_eigs = e(Slice(0, _nao - 1));


          if (_world.rank() == 0) printf("(%8.4f,%8.4f,%8.4f)\n",kpoint.k[0], kpoint.k[1], kpoint.k[2]);

          if (_world.rank() == 0) print(tmp_eigs);

          if (_world.rank() == 0) print("\n");


          //if (_world.rank() == 0) print("kinetic energy for kp = ", kp);

          //if (_world.rank() == 0) print(kinetic);

          //if (_world.rank() == 0) print("\n");


          // DEBUG

          if (_world.rank() == 0) {

              printf("Overlap: \n");

              for (int i = 0; i < kinetic.dim(0); i++)

                  {

                      for (int j = 0; j < kinetic.dim(1); j++)

                          {

                              printf("%10.5f", real(overlap(i,j)));

                          }

                      printf("\n");

                  }

              printf("\n");

              printf("\n");


              printf("Kinetic: \n");

              for (int i = 0; i < kinetic.dim(0); i++)

                  {

                      for (int j = 0; j < kinetic.dim(1); j++)

                          {

                              printf("%10.5f", real(kinetic(i,j)));

                          }

                      printf("\n");

                  }

              printf("\n");

              printf("\n");


              printf("V: \n");

              for (int i = 0; i < potential.dim(0); i++)

                  {

                      for (int j = 0; j < potential.dim(1); j++)

                          {

                              printf("%10.5f", real(potential(i,j)));

                          }

                      printf("\n");

                  }

              printf("\n");

              printf("\n");


              printf("Fock: \n");

              for (int i = 0; i < fock.dim(0); i++)

                  {

                      for (int j = 0; j < fock.dim(1); j++)

                          {

                              printf("%10.5f", real(fock(i,j)));

                          }

                      printf("\n");

                  }

              printf("\n");

              printf("\n");


              printf("New overlap: \n");

              for (int i = 0; i < overlap2.dim(0); i++)

                  {

                      for (int j = 0; j < overlap2.dim(1); j++)

                          {

                              printf("%10.5f", real(overlap2(i,j)));

                          }

                      printf("\n");

                  }

              printf("\n");

              printf("\n");

          }


          // Fill in orbitals and eigenvalues

          kpoint.begin = ki*_params.nbands;

          kpoint.end = (ki+1)*_params.nbands;

          for (unsigned int oi = kpoint.begin, ti = 0; oi < kpoint.end; oi++, ti++)

          {

            //if (_world.rank() == 0) print(oi, ti, kpt.begin, kpt.end);

            // normalize the orbitals

            //tmp_orbitals[ti].scale(1.0/tmp_orbitals[ti].norm2());

            _phisa.push_back(tmp_orbitals[ti]);

            _phisb.push_back(tmp_orbitals[ti]);

            _eigsa[oi] = tmp_eigs[ti];

            _eigsb[oi] = tmp_eigs[ti];

          }

        }

      }

    }


    //*************************************************************************


    //*************************************************************************

    // Constructor


    Solver(World& world,

           const rfunctionT& vnucrhon,

           const vecfuncT& phis,

           const std::vector<T>& eigs,

           const ElectronicStructureParams& params,

           MolecularEntity mentity)

       : _world(world), _vnucrhon(vnucrhon), _phisa(phis), _phisb(phis),

       _eigsa(eigs), _eigsb(eigs), _params(params), _mentity(mentity)

    {

      _residual = 1e5;

      if (params.periodic)

      {

        Tensor<double> box = FunctionDefaults<NDIM>::get_cell_width();

        //_cop = PeriodicCoulombOpPtr<T,NDIM>(const_cast<World&>(world),

        //    FunctionDefaults<NDIM>::get_k(), params.lo, params.thresh * 0.1, box);

        _cop = CoulombOperatorPtr(const_cast<World&>(world), params.lo, params.thresh * 0.1);

      }

      else

      {

        _cop = CoulombOperatorPtr(const_cast<World&>(world), params.lo, params.thresh * 0.1);

      }


      if (params.ispotential)

      {

        _vnuc = copy(_vnucrhon);

      }

      else

      {

        _vnuc = apply(*_cop, _vnucrhon);

      }

    }


    //*************************************************************************


    //*************************************************************************

    // Constructor


    Solver(World& world,

           rfunctionT vnucrhon,

           vecfuncT phis,

           std::vector<T> eigs,

           std::vector<KPoint> kpoints,

           std::vector<double> occs,

           ElectronicStructureParams params,

           MolecularEntity mentity)

       : _world(world), _vnucrhon(vnucrhon), _phisa(phis), _phisb(phis),

         _eigsa(eigs), _eigsb(eigs), _params(params),

         _kpoints(kpoints), _occsa(occs), _occsb(occs), _mentity(mentity)

    {

      _residual = 1e5;

      if (params.periodic)

      {

        Tensor<double> box = FunctionDefaults<NDIM>::get_cell_width();

        _cop = CoulombOperatorPtr(const_cast<World&>(world), params.lo, params.thresh * 0.1);

      }

      else

      {

        _cop = CoulombOperatorPtr(const_cast<World&>(world), params.lo, params.thresh * 0.1);

      }


      if (params.ispotential)

      {

        _vnuc = copy(_vnucrhon);

      }

      else

      {

        _vnuc = apply(*_cop, _vnucrhon);

      }

    }


    //*************************************************************************


    //*************************************************************************


    virtual ~Solver()

    {

      _outputF.close();

      _matF.close();

      _eigF.close();

      delete _subspace;

    }


    //*************************************************************************


    //***************************************************************************

    // set occupation numbers (only for insulators ... no smearing)


    void set_occs2(const std::vector<KPoint>& kpoints,

                   const std::vector<double>& eigsa,

                   const std::vector<double>& eigsb,

                   std::vector<double>& occsa,

                   std::vector<double>& occsb)

    {

      for (unsigned int ik = 0; ik < kpoints.size(); ik++)

      {

        // get k-point

        KPoint k = kpoints[ik];


        // pull subset of data that corresponds to k

        const std::vector<double> k_eigsa(eigsa.begin() + k.begin, eigsa.begin() + k.end);

        const std::vector<double> k_eigsb(eigsb.begin() + k.begin, eigsb.begin() + k.end);

        std::vector<double> k_occsa(occsa.begin() + k.begin, occsa.begin() + k.end);

        std::vector<double> k_occsb(occsb.begin() + k.begin, occsb.begin() + k.end);


        // demand all vectors have the same size

        unsigned int sz = k_eigsa.size();

        MADNESS_ASSERT(k_eigsb.size() == sz);

        MADNESS_ASSERT(k_occsa.size() == sz);

        MADNESS_ASSERT(k_occsb.size() == sz);

        // concatenate eigenvalues

        std::vector<double> teigs;

        //std::copy(k_eigsa.begin(), k_eigsa.end(), teigs.begin());

        //teigs.insert(teigs.end(), k_eigsb.begin(), k_eigsb.end());

        //std::copy(k_eigsb.begin(), k_eigsb.end(), back_inserter(teigs));

        for (unsigned int ist = 0; ist < k_eigsa.size(); ist++) teigs.push_back(k_eigsa[ist]);

        for (unsigned int ist = 0; ist < k_eigsb.size(); ist++) teigs.push_back(k_eigsb[ist]);


        if (_world.rank() == 0) printf("setting occs ....\n\n");

        for (unsigned int ist = 0; ist < teigs.size(); ist++)

        {

          if (_world.rank() == 0)

          {

            printf("%5d    %15.8f\n", ist, teigs[ist]);

          }

        }


        // indicies

        std::vector<unsigned int> inds(2*sz);

        for (unsigned int i = 0; i < 2*sz; i++) inds[i] = i;

        // sort by eigenvalue

        for (unsigned int i = 0; i < 2*sz; i++)

        {

          for (unsigned int j = i+1; j < 2*sz; j++)

          {

            if (teigs[j] < teigs[i])

            {

              double t1 = teigs[i];

              teigs[i] = teigs[j];

              teigs[j] = t1;

              int it1 = inds[i];

              inds[i] = inds[j];

              inds[j] = it1;

            }

          }

        }


        if (_world.rank() == 0)

          printf("\nSorted eigenvalues:\n");

        for (unsigned int i = 0; i < teigs.size(); i++)

        {

          if (_world.rank() == 0)

            printf("%10d%10d     %15.8f\n",i,inds[i],teigs[i]);

        }


        // assign occupation numbers

        double availablecharge = _params.ncharge;

        for (unsigned int i = 0; (i < 2*sz) && (availablecharge > 0.0) ; i++)

        {

          unsigned int current = inds[i];

          if (current >= sz)

          {

            current -= sz;

            k_occsb[current] = 1.0;

            availablecharge -= 1.0;

          }

          else

          {

            k_occsa[current] = 1.0;

            availablecharge -= 1.0;

          }

        }


        for (unsigned int ik1 = k.begin, ik2 = 0; ik1 < k.end; ik1++,ik2++)

        {

          occsa[ik1] = k_occsa[ik2];

          occsb[ik1] = k_occsb[ik2];

        }

      }


      for (unsigned int ik = 0; ik < kpoints.size(); ik++)

      {

        KPoint k = kpoints[ik];

        if (_world.rank() == 0)

        {

          printf("k-point is: %d: \n",ik);

        }

        for (unsigned int ist = k.begin; ist < k.end; ist++)

        {

          if (_world.rank() == 0)

          {

            printf("occa:    %12.5f          occb:    %12.5f \n",occsa[ist],occsb[ist]);

          }

        }

      }


    }


    //***************************************************************************


    //***************************************************************************

    /*!

     \ingroup periodic_solver

     \brief Compute the electronic density for either a molecular or periodic

            system.

     */


    rfunctionT compute_rho_slow(const vecfuncT& phis, std::vector<KPoint> kpoints,

                               std::vector<double> occs)

    {

      // Electron density

      rfunctionT rho = rfactoryT(_world);

      _world.gop.fence();

      if (_world.rank() == 0) _outputF << "computing rho ..." << endl;

      // Loop over k-points

      for (unsigned int kp = 0; kp < kpoints.size(); kp++)

      {

        // get k-point

        KPoint kpoint = kpoints[kp];

        // loop through bands

        for (unsigned int j = kpoint.begin; j < kpoint.end; j++)

        {

          // Get phi(j) from iterator

          const functionT& phij = phis[j];

          // Compute the j-th density

          //rfunctionT prod = abs_square(phij);

          rfunctionT prod = abssq(phij,true);

          double rnrm = prod.trace();

          prod.scale(1/rnrm);

//          rho += 0.5 * _occs[j] * kpoint.weight * prod;

          rho += occs[j] * kpoint.weight * prod;

        }

      }

      rho.truncate();


      return rho;

    }


    // computes the electronic density for 1 spin


    rfunctionT compute_rho(const vecfuncT& phis, std::vector<KPoint> kpoints,

                          std::vector<double> occs)

    {

      if (_world.rank() == 0) _outputF << "computing rho ..." << endl;

      rfunctionT rho = rfactoryT(_world);       // Electron density


      reconstruct(_world, phis); // For max parallelism

      std::vector<rfunctionT> phisq(phis.size());

      for (unsigned int i=0; i<phis.size(); i++) {

          phisq[i] = abssq(phis[i],false);

      }

      _world.gop.fence();

      std::vector<double> phinorm = norm2s(_world, phis);


      compress(_world,phisq); // since will be using gaxpy for accumulation

      rho.compress();


      // Loop over k-points

      for (unsigned int kp = 0; kp < kpoints.size(); kp++)

      {

        // get k-point

        KPoint kpoint = kpoints[kp];

        // loop through bands

        for (unsigned int j = kpoint.begin; j < kpoint.end; j++)

        {

          rho.gaxpy(1.0, phisq[j], occs[j] * kpoint.weight / (phinorm[j]*phinorm[j]), false);

        }

      }

      _world.gop.fence();

      phisq.clear();

      rho.truncate();


      return rho;

    }


    //***************************************************************************


    //***************************************************************************


    std::vector<poperatorT> make_bsh_operators(const std::vector<T>& eigs)

    {

      // Make BSH vector

      std::vector<poperatorT> bops;

      // Get defaults

      double tol = FunctionDefaults<NDIM>::get_thresh();

      // Loop through eigenvalues, adding a BSH operator to bops

      // for each eigenvalue

      int sz = eigs.size();

      for (int i = 0; i < sz; i++)

      {

          T eps = eigs[i];

          if (eps > 0)

          {

              if (_world.rank() == 0)

              {

                  std::cout << "bsh: warning: positive eigenvalue" << i << eps << endl;

              }

              eps = -0.1;

          }


          bops.push_back(poperatorT(BSHOperatorPtr3D(_world, sqrt(-2.0*eps), _params.lo, tol * 0.1)));

      }

      return bops;

    }


    //*************************************************************************


    //*************************************************************************

//    void loadbal()

//    {

//        if(_world.size() == 1)

//            return;

//

//        LoadBalanceDeux<3> lb(_world);

//        lb.add_tree(_vnuc, lbcost<double,3>(1.0, 0.0), false);

//        lb.add_tree(_rhoa, lbcost<double,3>(1.0, 1.0), false);

//        for(unsigned int i = 0;i < _phisa.size();i++)

//        {

//            lb.add_tree(_phisa[i], lbcost<valueT,3>(1.0, 1.0), false);

//        }

//        if(_params.spinpol)

//        {

//            lb.add_tree(_rhob, lbcost<double,3>(1.0, 1.0), false);

//            for(unsigned int i = 0;i < _phisb.size();i++)

//            {

//                lb.add_tree(_phisa[i], lbcost<valueT,3>(1.0, 1.0), false);

//            }

//        }

//

//        FunctionDefaults<3>::redistribute(_world, lb.load_balance(6.0));

//   }

   //*************************************************************************


    //*************************************************************************


    double calculate_kinetic_energy()

    {

      double ke = 0.0;

      if (!_params.periodic)

      {

        complex_derivative_3d Dx(_world,0);

        complex_derivative_3d Dy(_world,1);

        complex_derivative_3d Dz(_world,2);

        for (unsigned int i = 0; i < _phisa.size(); i++)

        {

          functionT dpdx = Dx(_phisa[i]);

          functionT dpdy = Dy(_phisa[i]);

          functionT dpdz = Dz(_phisa[i]);

          ke += 0.5 * (real(inner(dpdx,dpdx)) + real(inner(dpdy,dpdy))

              + real(inner(dpdz,dpdz)));

        }

        if (_params.spinpol)

        {

          for (unsigned int i = 0; i < _phisb.size(); i++)

          {

            functionT dpdx = Dx(_phisb[i]);

            functionT dpdy = Dy(_phisb[i]);

            functionT dpdz = Dz(_phisb[i]);

            ke += 0.5 * (real(inner(dpdx,dpdx)) + real(inner(dpdy,dpdy))

                + real(inner(dpdz,dpdz)));

          }

        }

        else

        {

          ke *= 2.0;

        }

      }

      return ke;

    }


    //*************************************************************************


    //*************************************************************************

    /*!

     \ingroup periodic_solver

     \brief Applies the LDA effective potential to each orbital. Currently only

            lda and spin-polarized is not implemented.

     */


    void apply_potential(vecfuncT& pfuncsa,

        vecfuncT& pfuncsb, const vecfuncT& phisa,

        const vecfuncT& phisb, const rfunctionT& rhoa, const rfunctionT& rhob,

        const rfunctionT& rho)

    {

      // Nuclear and coulomb potentials

      rfunctionT vc = apply(*_cop, rho);


      // combined density

      rfunctionT rho2 = rho + _vnucrhon;

      double vnucrhontrace = _vnucrhon.trace();

      double rhotrace = rho.trace();

      double rho2trace = rho2.trace();

      if (_world.rank() == 0) printf("_vnucrhon trace: %10e\n", vnucrhontrace);

      if (_world.rank() == 0) printf("rho trace: %10e\n", rhotrace);

      if (_world.rank() == 0) printf("rho2 trace: %10e\n", rho2trace);

      rfunctionT vlocal = (_params.ispotential) ? _vnuc + vc : apply(*_cop, rho2);

      rfunctionT vlocal2 = _vnuc + vc;

      double vlerr = (vlocal-vlocal2).norm2();

      if (_world.rank() == 0) printf("vlerr trace: %10e\n\n", vlerr);


      // Calculate energies for Coulomb and nuclear

      double ce = 0.5*inner(vc,rho);

      double pe = inner(_vnuc,rho);

      double xc = 0.0;

      double ke = calculate_kinetic_energy();

      // Exchange

      if (_params.functional == 1)

      {

        // LDA, is calculation spin-polarized?

        if (_params.spinpol)

        {

            MADNESS_EXCEPTION("Spin polarized not implemented!",0);

//          // potential

//          rfunctionT vxca = binary_op(rhoa, rhob, &::libxc_ldaop_sp<double>);

//          rfunctionT vxcb = binary_op(rhob, rhoa, &::libxc_ldaop_sp<double>);

//          pfuncsa = mul_sparse(_world, vlocal + vxca, phisa, _params.thresh * 0.1);

//          pfuncsb = mul_sparse(_world, vlocal + vxcb, phisb, _params.thresh * 0.1);

//          // energy

//          rfunctionT fca = binary_op(rhoa, rhob, &::libxc_ldaeop_sp<double>);

//          rfunctionT fcb = binary_op(rhob, rhoa, &::libxc_ldaeop_sp<double>);

//          xc = fca.trace() + fcb.trace();

        }

        else

        {

          // potential

          rfunctionT vxc = copy(rhoa);

//          vxc.unaryop(&::libxc_ldaop<double>);

          START_TIMER(_world);

          vxc.unaryop(&::ldaop<double>);


          //test_periodicity(vc);

//          for (unsigned int i = 0; i < phisa.size(); i++)

//          {

//            test_periodicity(phisa[i]);

//          }


          pfuncsa = mul_sparse(_world, vlocal2+vxc, phisa, _params.thresh * 0.1);

//          rfunctionT vxc2 = binary_op(rhoa, rhoa, &::libxc_ldaop_sp<double>);

//          pfuncsa = mul_sparse(_world, vlocal + vxc2, phisa, _params.thresh * 0.1);


//          for (unsigned int i = 0; i < pfuncsa.size(); i++)

//          {

//            test_periodicity(pfuncsa[i]);

//          }


          END_TIMER(_world,"Applying LDA potential");

          // energy

          rfunctionT fc = copy(rhoa);

          fc.unaryop(&::ldaeop<double>);

          xc = fc.trace();

        }

      }

      else if (_params.functional == 2)

      {

        START_TIMER(_world);

        pfuncsa = mul_sparse(_world, vlocal, phisa, _params.thresh * 0.1);

        END_TIMER(_world,"Applying local potential");

        START_TIMER(_world);

        // gamma-point?

        if ((_params.ngridk0 == 1) && (_params.ngridk1 == 1) && (_params.ngridk2 == 1))

        {

          apply_hf_exchange3(_phisa, _phisb, pfuncsa, pfuncsb, xc);

        }

        else

        {

          apply_hf_exchange4(_phisa, _phisb, pfuncsa, pfuncsb, xc);

        }

        END_TIMER(_world, "Applying HF exchange");

      }

      std::cout.precision(8);

      if (_world.rank() == 0)

      {

        printf("Energies:\n");

        printf("Kinetic energy:     %20.10f\n", ke);

        printf("Potential energy:   %20.10f\n", pe);

        printf("Coulomb energy:     %20.10f\n", ce);

        printf("Exchange energy:    %20.10f\n", xc);

        printf("Total energy:       %20.10f\n\n", ke + pe + ce + xc);

      }

    }


    //*************************************************************************


    // working for a molecule / atom ... need to test with periodic boundary

    // conditions as a gamma point only calculation

    //*************************************************************************

//    void apply_hf_exchange2(vecfuncT& phisa, vecfuncT& phisb,

//                           vecfuncT& funcsa, vecfuncT& funcsb,

//                           double& xc)

//    {

//      Vector<double,3> q {0.0,0.0,0.0};

//      SeparatedConvolution<double_complex,3> hfexop =

//          PeriodicHFExchangeOperator(_world, q, _params.lo,

//              FunctionDefaults<3>::get_thresh() * 0.1);

//      for (unsigned int i = 0; i < phisa.size(); i++)

//      {

//        bool isreal1 = is_real<T,NDIM>(phisa[i]);

//        MADNESS_ASSERT(isreal1);

////        rfunctionT phi_i = real(phisa[i]);

//        for (unsigned int j = 0; j < phisa.size(); j++)

//        {

//          bool isreal2 = is_real<T,NDIM>(phisa[j]);

//          MADNESS_ASSERT(isreal2);

////          rfunctionT phi_j = real(phisa[j]);

////          rfunctionT prod = phi_i*phi_j;

//          functionT prod = phisa[i]*phisa[j];

//          prod.truncate();

////          rfunctionT Vex = apply(*_cop,prod);

//          rfunctionT Vex = real(apply(hfexop,prod));

//          functionT tf1 = Vex*phisa[j];

//          funcsa[i] -= tf1;

//          xc -= real(inner(phisa[i],tf1));

//        }

//      }

//    }

    //*************************************************************************


    // working for a molecule / atom ... works for a gamma point calculation

    //*************************************************************************


    void apply_hf_exchange3(vecfuncT& phisa, vecfuncT& phisb,

                            vecfuncT& funcsa, vecfuncT& funcsb,

                            double& xc)

    {

      for (unsigned int j = 0; j < phisa.size(); j++)

      {

        rfunctionT phi_j = real(phisa[j]);

        // do diagonal piece first

        rfunctionT dprod = phi_j*phi_j;

        dprod.truncate();

        rfunctionT dVex = apply(*_cop,dprod);

        functionT tf_jjj = dVex*phisa[j];

        funcsa[j] -= tf_jjj;

        xc -= real(inner(phisa[j],tf_jjj));

        for (unsigned int i = j+1; i < phisa.size(); i++)

        {

          rfunctionT phi_i = real(phisa[i]);

          rfunctionT prod = phi_i*phi_j;

          prod.truncate();

          rfunctionT Vex = apply(*_cop,prod);

          // do the jij-th term

          functionT tf_jij = Vex*phisa[j];

          funcsa[i] -= tf_jij;

          xc -= real(inner(phisa[i],tf_jij));

          // do the iji-th term (in the complex case, use the complex

          // conjugate)

          functionT tf_iji = Vex*phisa[i];

          funcsa[j] -= tf_iji;

          xc -= real(inner(phisa[j],tf_iji));

        }

      }

    }


    //*************************************************************************


    //*************************************************************************


    KPoint find_kpt_from_orb(unsigned int idx)

    {

      for (unsigned int i = 0; i < _kpoints.size(); i++)

      {

        KPoint k1 = _kpoints[i];

        if (k1.is_orb_in_kpoint(idx)) return k1;

      }

      MADNESS_EXCEPTION("Error: find_kpt_from_orb: didn't find kpoint\n", 0);

    }


    //************************************************************************


    // hf exchange with k-points for periodic solid

    //*************************************************************************


    void apply_hf_exchange4(vecfuncT& phisa, vecfuncT& phisb,

                           vecfuncT& funcsa, vecfuncT& funcsb,

                           double& xc)

    {

      for (unsigned int i = 0; i < phisa.size(); i++)

      {

        functionT phi_i = phisa[i];

        KPoint k_i = find_kpt_from_orb(i);

        for (unsigned int j = 0; j < phisa.size(); j++)

        {

          functionT phi_j = phisa[j];

          KPoint k_j = find_kpt_from_orb(j);

          Vector<double,3> q {(k_i.k[0]-k_j.k[0])*_params.L,

                              (k_i.k[1]-k_j.k[1])*_params.L,

                              (k_i.k[2]-k_j.k[2])*_params.L};

          Vector<double,3> q2 {k_i.k[0]-k_j.k[0],

                               k_i.k[1]-k_j.k[1],

                               k_i.k[2]-k_j.k[2]};

          functionT cexp =

              factoryT(_world).functor(functorT(new

                  ComplexExp<3>(q2, double_complex(1.0,0.0))));

          functionT cexp2 = conj(cexp);

          cexp.truncate();

          cexp2.truncate();

          functionT prod = phi_i*phi_j*cexp;

          SeparatedConvolution<double_complex,3> hfexop =

              PeriodicHFExchangeOperator(_world, q, _params.lo,

                  FunctionDefaults<3>::get_thresh() * 0.1);

          functionT Vex = apply(hfexop,prod);

          functionT tf1 = Vex*phisa[j]*cexp2;

          funcsa[i] -= tf1;

          xc -= real(inner(phisa[i],tf1));

        }

      }

    }


    //*************************************************************************


    // not working and not tested .... supposed to be for the periodic boundary

    // conditions with k-points

    //*************************************************************************


    void apply_hf_exchange(vecfuncT& phisa, vecfuncT& phisb,

                           vecfuncT& funcsa, vecfuncT& funcsb)

    {

      for (unsigned int ink1 = 0, ik1 = 0; ink1 < _phisa.size(); ++ink1)

      {

        for (unsigned int ink2 = 0, ik2 = 0; ink2 <= ink1; ink2++)

        {

          KPoint k1 = _kpoints[ik1];

          KPoint k2 = _kpoints[ik2];


          if (ink1 == k1.end) ik1++;

          if (ink2 == k2.end) ik2++;


          MADNESS_ASSERT(ik1 == 0);

          MADNESS_ASSERT(ik2 == 0);


          // no phase factor

          if (ik1 == ik2)

          {

//            // same state (diagonal piece)

//            if (ink1 == ink2)

//            {

//              rfunctionT prod = abs_square(phisa[ink1]);

//              rfunctionT fr = apply(*_cop,prod);

//              funcsa[ink1] -= funcsa[ink1]*fr;

//            }

//            else

            {

              Vector<double,3> q = 0.0;

              functionT f = phisa[ink1]*conj(phisa[ink2]);

              SeparatedConvolution<double_complex,3> hfexop =

                  PeriodicHFExchangeOperator(_world, q, _params.lo, FunctionDefaults<3>::get_thresh() * 0.1);

              functionT fr = apply(hfexop,f);

              funcsa[ink1] -= funcsa[ink2]*fr;

              funcsa[ink2] -= funcsa[ink1]*conj(fr);


              // test code

              rfunctionT g1 = abs(phisa[ink1]);

              rfunctionT g2 = abs(phisa[ink2]);

              rfunctionT ff = g1*g2;


              printf("norm diff: %20.8f\n", abs(ff.norm2()-f.norm2()));

              MADNESS_ASSERT(abs(ff.norm2()-f.norm2()) <= 1e-5);

              rfunctionT fr2 = apply(*_cop,ff);

              MADNESS_ASSERT(abs(fr.norm2()-fr2.norm2()) <= 1e-5);

            }

          }

//          else

//          {

//            Vector<double,3> q = VectorFactory(k1.k[0]-k2.k[0],

//                                               k1.k[1]-k2.k[1],

//                                               k1.k[2]-k2.k[2]);

//            functionT cexp = factoryT(_world).functor(functorT(new ComplexExp<3>(q, double_complex(1.0,0.0))));

//            cexp.truncate();

//

//            functionT f = phisa[ink1]*conj(phisa[ink2])*cexp;

//            SeparatedConvolution<double_complex,3> hfexop =

//                PeriodicHFExchangeOperator(_world, q, _params.lo, FunctionDefaults<3>::get_thresh() * 0.1);

//            functionT fr = apply(hfexop,f);

//            funcsa[ink1] -= phisa[ink1]*fr*conj(cexp);

//            funcsa[ink2] -= phisa[ink2]*conj(fr)*cexp;

//          }

        }

      }

    }


    //*************************************************************************


    //*************************************************************************


    void reproject()

    {

      _params.waveorder += 2;

      _params.thresh /= 100;

      FunctionDefaults<3>::set_thresh(_params.thresh);

      FunctionDefaults<3>::set_k(_params.waveorder);

      if (_world.rank() == 0) _outputF << "reprojecting to wavelet order "

          << _params.waveorder << endl;

      reconstruct(_world, _phisa);

      for(unsigned int i = 0; i < _phisa.size(); i++)

      {

        _phisa[i] = madness::project(_phisa[i], FunctionDefaults<3>::get_k(),

          FunctionDefaults<3>::get_thresh(), false);

      }

      _world.gop.fence();

      truncate(_world, _phisa);

      normalize(_world, _phisa);

      if(_params.spinpol)

      {

        reconstruct(_world, _phisb);

        for(unsigned int i = 0; i < _phisb.size(); i++)

        {

            _phisb[i] = madness::project(_phisb[i], FunctionDefaults<3>::get_k(),

              FunctionDefaults<3>::get_thresh(), false);

        }

        _world.gop.fence();

        truncate(_world, _phisb);

        normalize(_world, _phisb);

      }


      delete _cop;

      make_nuclear_potential();

      //_subspace->reproject();

      delete _subspace;

      _subspace = new Subspace<T,NDIM>(_world, _params);

    }


    //*************************************************************************


    //*************************************************************************


    void solve()

    {


      // WSTHORNTON (debug) Test periodicity

//      if (_world.rank() == 0) printf("initial orbitals (periodicity) ...\n\n");

//      for (unsigned int i = 0; i < _phisa.size(); i++)

//      {

//        if (_world.rank() == 0) printf("orbital %d\n",i);

//        test_periodicity(_phisa[i]);

//        if (_world.rank() == 0) printf("\n\n");

//      }

//      if (_world.rank() == 0) printf("\n\n\n\n");


      if (_world.rank() == 0) print("size of phisa is:  ", _phisa.size());

      // keep track of how many iterations have gone by without reprojecting

      int rit = 0;

      int rpthresh = 20;

      for (_it = 0; _it < _params.maxits && _residual > _params.rcriterion; _it++, rit++)

      {

        // should we reproject?

        if ((_it > 0) && ((_residual < 20*_params.thresh) || (rit == rpthresh)))

        {

          // reproject orbitals and reset threshold

          reproject();

          rit = 0;

        }


        if (_world.rank() == 0) _outputF << "_it = " << _it << endl;


        // Set occupation numbers

        set_occs2(_kpoints,_eigsa,_eigsb,_occsa,_occsb);


        // Compute density

        rfunctionT rhoa = compute_rho(_phisa, _kpoints, _occsa);

        rfunctionT rhob = (_params.spinpol) ? compute_rho(_phisb, _kpoints, _occsb) : rhoa;

//        rfunctionT rhoa = _rhoa;

//        rfunctionT rhob = _rhob;

        double drhoa = (_rhoa-rhoa).trace();

        double drhob = (_rhob-rhob).trace();

        if (_world.rank() == 0)

        {

          printf("diff of alpha rho: %15.7f\n",drhoa);

          printf("diff of beta rho: %15.7f\n",drhob);

        }


        _rho = rhoa + rhob;


        _rhoa = rhoa;

        _rhob = rhob;

        double rtrace = _rho.trace();

        if (_world.rank() == 0) _outputF << "trace of rho" << rtrace << endl;


//        if(_it < 2 || (_it % 10) == 0)

//        {

//          START_TIMER(_world);

//          //loadbal();

//          END_TIMER(_world, "Load balancing");

//        }


        std::vector<functionT> pfuncsa =

                zero_functions<valueT,NDIM>(_world, _phisa.size());

        std::vector<functionT> pfuncsb =

                zero_functions<valueT,NDIM>(_world, _phisb.size());


        // Apply the potentials to the orbitals

        if (_world.rank() == 0) _outputF << "applying potential ...\n" << endl;

        //START_TIMER(_world);

        apply_potential(pfuncsa, pfuncsb, _phisa, _phisb, _rhoa, _rhob, _rho);

        //END_TIMER(_world,"apply potential");


        // Do right hand side for all k-points

        std::vector<double> alpha(pfuncsa.size(), 0.0);

        do_rhs_simple(_phisa, pfuncsa, _kpoints, alpha, _eigsa);


        if (_params.plotorbs)

        {

          std::vector<long> npt(3,101);

          for (unsigned int ik = 0; ik < _kpoints.size(); ik++)

          {

            KPoint kpoint = _kpoints[ik];

            int ist = 0;

            for (unsigned int kst = kpoint.begin; kst < kpoint.end; kst++, ist++)

            {

              std::ostringstream strm;

              strm << "pre_unk_" << ik << "_" << ist << ".dx";

              std::string fname = strm.str();

              plotdx(_phisa[kst], fname.c_str(), FunctionDefaults<3>::get_cell(), npt);

            }

          }

        }

        // WSTHORNTON

        // DEBUG

        if (_world.rank() == 0)

          printf("\n\n\n\n------ Debugging BSH operator -----");

        for (unsigned int ik = 0; ik < _kpoints.size(); ik++)

        {

          KPoint kpoint = _kpoints[ik];

          std::vector<double> k_alpha(alpha.begin() + kpoint.begin, alpha.begin() + kpoint.end);

          if (_world.rank() == 0)

            printf("alpha: (%6.4f,%6.4f,%6.4f)\n",kpoint.k[0],kpoint.k[1],kpoint.k[2]);

          for (unsigned int ia = 0; ia < k_alpha.size(); ia++)

          {

            if (_world.rank() == 0) printf("%15.8f\n", k_alpha[ia]);

          }

        }

        if (_world.rank() == 0) printf("\n\n\n\n");


        // WSTHORNTON (debug)

        if (_world.rank() == 0) printf("before BSH application ...\n\n");

        for (unsigned int ik = 0; ik < _kpoints.size(); ik++)

        {

          KPoint kpoint = _kpoints[ik];

          double k0 = kpoint.k[0];

          double k1 = kpoint.k[1];

          double k2 = kpoint.k[2];

          if (_world.rank() == 0)

            printf("(%6.5f, %6.5f, %6.5f)\n",k0,k1,k2);

          std::vector<functionT> k_phisa(_phisa.begin() + kpoint.begin, _phisa.begin() + kpoint.end);

          std::vector<functionT> k_pfuncsa(pfuncsa.begin() + kpoint.begin, pfuncsa.begin() + kpoint.end);

          KPoint kpoint_gamma;

          print_fock_matrix_eigs(k_phisa, k_pfuncsa, kpoint_gamma);


          // diagonalize overlap

          tensorT overlap = matrix_inner(_world,k_pfuncsa,k_pfuncsa,true);

          ctensorT co; rtensorT eo;

          syev(overlap, co, eo);


          if (_world.rank() == 0) printf("Overlap eigenvalues: \n");

          if (_world.rank() == 0) print(overlap);

          for (unsigned int ie = 0; ie < eo.dim(0); ie++)

          {

            if (_world.rank() == 0) printf("%d    %15.8e\n", ie, eo(ie,ie));

          }


        }

        if (_world.rank() == 0) printf("\n\n\n\n");


        // WSTHORNTON (debug) Test periodicity

//        if (_world.rank() == 0) printf("before BSH application (periodicity) ...\n\n");

//        for (unsigned int i = 0; i < _phisa.size(); i++)

//        {

//          if (_world.rank() == 0) printf("orbital %d\n",i);

//          test_periodicity(_phisa[i]);

//          if (_world.rank() == 0) printf("\n\n");

//        }

//        if (_world.rank() == 0) printf("\n\n\n\n");


        // Make BSH Green's function

        std::vector<poperatorT> bopsa = make_bsh_operators(alpha);

        std::vector<T> sfactor(pfuncsa.size(), -2.0);

        scale(_world, pfuncsa, sfactor);


        // Apply Green's function to orbitals

        if (_world.rank() == 0) std::cout << "applying BSH operator ...\n" << endl;

        truncate<valueT,NDIM>(_world, pfuncsa);

        START_TIMER(_world);

        std::vector<functionT> tmpa = apply(_world, bopsa, pfuncsa);

        END_TIMER(_world,"apply BSH");

        bopsa.clear();


        // WSTHORNTON

        // norms

        if (_world.rank() == 0) printf("norms of tmpa\n");

        std::vector<double> tmpa_norms = norm2s(_world, tmpa);

        for (unsigned int i = 0; i < tmpa_norms.size(); i++)

        {

          if (_world.rank() == 0) printf("%10d     %15.8f\n", i, tmpa_norms[i]);

        }

        if (_world.rank() == 0) printf("\n\n\n\n");


        // Do other spin

        vecfuncT tmpb = zero_functions<valueT,NDIM>(_world, _phisb.size());

        if (_params.spinpol)

        {

          alpha = std::vector<double>(_phisb.size(), 0.0);

          do_rhs_simple(_phisb, pfuncsb,  _kpoints, alpha, _eigsb);

          std::vector<poperatorT> bopsb = make_bsh_operators(alpha);

          scale(_world, pfuncsb, sfactor);

          truncate<valueT,NDIM>(_world, pfuncsb);

          tmpb = apply(_world, bopsb, pfuncsb);

          bopsb.clear();

        }

        else

        {

          for (unsigned int i = 0; i < _eigsa.size(); i++) _eigsb[i] = _eigsa[i];

        }


        // WSTHORNTON (debug)

        std::vector<functionT> pfuncsa2=

                zero_functions<valueT,NDIM>(_world, _phisa.size());

        std::vector<functionT> pfuncsb2=

                zero_functions<valueT,NDIM>(_world, _phisa.size());


        // Apply the potentials to the orbitals

        if (_world.rank() == 0) _outputF << "applying potential2 ...\n" << endl;

        apply_potential(pfuncsa2, pfuncsb2, tmpa, tmpb, _rhoa, _rhob, _rho);

        for (unsigned int ik = 0; ik < _kpoints.size(); ik++)

        {

          KPoint kpoint = _kpoints[ik];

          double k0 = kpoint.k[0];

          double k1 = kpoint.k[1];

          double k2 = kpoint.k[2];

          if (_world.rank() == 0)

            printf("(%6.5f, %6.5f, %6.5f)\n",k0,k1,k2);

          std::vector<functionT> k_tmpa(tmpa.begin() + kpoint.begin, tmpa.begin() + kpoint.end);

          std::vector<functionT> k_pfuncsa2(pfuncsa2.begin() + kpoint.begin, pfuncsa2.begin() + kpoint.end);

          print_fock_matrix_eigs(k_tmpa, k_pfuncsa2, kpoint);


          // diagonalize overlap

//          tensorT overlap = matrix_inner(_world,k_tmpa,k_tmpa,true);

//          if (_world.rank() == 0) print(overlap);

//          ctensorT co; rtensorT eo;

//          syev(overlap, co, eo);

//

//          if (_world.rank() == 0) printf("Overlap eigenvalues: \n");

//          for (unsigned int ie = 0; ie < eo.dim(0); ie++)

//          {

//            if (_world.rank() == 0) printf("%d    %15.8e\n", ie, eo(ie,ie));

//          }

        }

        if (_world.rank() == 0) printf("\n\n\n\n");


        if (_world.rank() == 0) printf("\n\n\n\n");


        // Update orbitals

        update_orbitals(tmpa, tmpb, _kpoints);

        save_orbitals();


        // WSTHORNTON

        if (_world.rank() == 0) _outputF << "after update_orbitals() ...\n" << endl;

        pfuncsa2=zero_functions<valueT,NDIM>(_world, _phisa.size());

        pfuncsb2=zero_functions<valueT,NDIM>(_world, _phisa.size());

        apply_potential(pfuncsa2, pfuncsb2, _phisa, _phisb, _rhoa, _rhob, _rho);

        for (unsigned int ik = 0; ik < _kpoints.size(); ik++)

        {

          KPoint kpoint = _kpoints[ik];

          double k0 = kpoint.k[0];

          double k1 = kpoint.k[1];

          double k2 = kpoint.k[2];

          if (_world.rank() == 0)

            printf("(%6.5f, %6.5f, %6.5f)\n",k0,k1,k2);

          std::vector<functionT> k_phisa(_phisa.begin() + kpoint.begin, _phisa.begin() + kpoint.end);

          std::vector<functionT> k_pfuncsa2(pfuncsa2.begin() + kpoint.begin, pfuncsa2.begin() + kpoint.end);

          print_fock_matrix_eigs(k_phisa, k_pfuncsa2, kpoint);

        }

        if (_world.rank() == 0) printf("\n\n\n\n");


      }


      if (_params.plotorbs)

      {

        std::vector<long> npt(3,101);

        for (unsigned int ik = 0; ik < _kpoints.size(); ik++)

        {

          KPoint kpoint = _kpoints[ik];

          int ist = 0;

          for (unsigned int kst = kpoint.begin; kst < kpoint.end; kst++, ist++)

          {

            std::ostringstream strm;

            strm << "unk_" << ik << "_" << ist << ".dx";

            std::string fname = strm.str();

            plotdx(_phisa[kst], fname.c_str(), FunctionDefaults<3>::get_cell(), npt);

          }

        }

      }

      save_orbitals();

    }


    //*************************************************************************


    //*************************************************************************


    ctensorT matrix_exponential(const ctensorT& A) {

        const double tol = 1e-13;

        MADNESS_ASSERT(A.dim(0) == A.dim(1));


        // Scale A by a power of 2 until it is "small"

        double anorm = A.normf();

        int n = 0;

        double scale = 1.0;

        while (anorm*scale > 0.1)

        {

            n++;

            scale *= 0.5;

        }

        tensorT B = scale*A;    // B = A*2^-n


        // Compute exp(B) using Taylor series

        ctensorT expB = ctensorT(2, B.dims());

        for (int i = 0; i < expB.dim(0); i++) expB(i,i) = std::complex<T>(1.0,0.0);


        int k = 1;

        ctensorT term = B;

        while (term.normf() > tol)

        {

            expB += term;

            term = inner(term,B);

            k++;

            term.scale(1.0/k);

        }


        // Repeatedly square to recover exp(A)

        while (n--)

        {

            expB = inner(expB,expB);

        }


        return expB;

    }


    //*************************************************************************


    //*************************************************************************

    template<typename Q>


    void print_tensor2d(ostream& os, Tensor<Q> t)

    {

      os.precision(5);

      for (int i = 0; i < t.dim(0); i++)

      {

        for (int j = 0; j < t.dim(1); j++)

        {

          os << t(i,j) << setw(12);

        }

        os << endl;

      }

      os << endl;

    }


    //*************************************************************************


    //*************************************************************************


    void print_potential_matrix_eigs(const vecfuncT& wf, const vecfuncT& vwf)

    {

      // Build the potential matrix

      START_TIMER(_world);

      tensorT potential = matrix_inner(_world, wf, vwf, true);

      _world.gop.fence();

      END_TIMER(_world,"potential energy matrix");

      if (_world.rank()==0) printf("\n");

      tensorT overlap = matrix_inner(_world,wf,wf,true);

      _world.gop.fence();


      // diagonalize potential

      ctensorT cp; rtensorT ep;

      sygv(potential, overlap, 1, cp, ep);

      if (_world.rank() == 0)

      {

        print("potential eigenvectors dims:",cp.dim(0),cp.dim(1));

        print("potential eigenvectors:");

        print(cp);

        printf("\n\n");

        print("potential eigenvalues:");

        print(ep);

        printf("\n\n");

      }


    }


    //*************************************************************************


    //*************************************************************************


    void print_fock_matrix_eigs(const vecfuncT& wf, const vecfuncT& vwf, KPoint kpoint)

    {

      // Build the potential matrix

      START_TIMER(_world);

      tensorT potential = matrix_inner(_world, wf, vwf, true);

      _world.gop.fence();

      END_TIMER(_world,"potential energy matrix");

      if (_world.rank()==0) printf("\n");


      START_TIMER(_world);

      if (_world.rank() == 0) _outputF << "Building kinetic energy matrix ...\n\n" << endl;

        //tensorT kinetic = ::kinetic_energy_matrix_slow<T,NDIM>(_world, psi,

        //                                          _params.periodic,

        //                                          kpoint);

        tensorT kinetic = ::kinetic_energy_matrix<T,NDIM>(_world, wf,

                                                  _params.periodic,

                                                  kpoint);

      _world.gop.fence();

      END_TIMER(_world,"kinetic energy matrix");

      if (_world.rank() == 0) printf("\n");


      if (_world.rank() == 0) _outputF << "Constructing Fock matrix ...\n\n" << endl;

      tensorT fock = potential + kinetic;

      fock = 0.5 * (fock + conj_transpose(fock));

      _world.gop.fence();


      // DEBUG

      tensorT overlap = matrix_inner(_world,wf,wf,true);

      _world.gop.fence();


      // diagonlize kinetic

      ctensorT ck; rtensorT ek;

      sygv(kinetic, overlap, 1, ck, ek);

      // diagonalize potential

      ctensorT cp; rtensorT ep;

      sygv(potential, overlap, 1, cp, ep);

      // diagonalize overlap

      ctensorT co; rtensorT eo;

      syev(overlap, co, eo);

      ctensorT c; rtensorT e;

      sygv(fock, overlap, 1, c, e);


      if (_world.rank() == 0)

      {

        print("kinetic matrix:");

        print(kinetic);

        print("\nkinetic eigenvalues:");

        print(ek);

        print("\n");


        print("potential matrix:");

        print(potential);

        print("\npotential eigenvalues:");

        print(ep);

        print("\n");


        print("fock matrix:");

        print(fock);

        print("\nfock eigenvalues:");

        print(e);

        print("\n");

      }


    }


    //*************************************************************************


    //*************************************************************************


    void do_rhs(vecfuncT& wf,

                vecfuncT& vwf,

                std::vector<KPoint> kpoints,

                std::vector<T>& alpha,

                std::vector<double>& eigs)

    {

      // tolerance

      double trantol = 0.1*_params.thresh/std::min(30.0,double(wf.size()));

      double thresh = 1e-4;


      if (_world.rank() == 0) _eigF << "Iteration: " << _it << endl;

      for (unsigned int kp = 0; kp < kpoints.size(); kp++)

      {

        // Get k-point and orbitals for this k-point

        KPoint kpoint = kpoints[kp];

        double k0 = kpoint.k[0];

        double k1 = kpoint.k[1];

        double k2 = kpoint.k[2];

        // Extract the relevant portion of the list of orbitals and the list of the

        // V times the orbitals

        vecfuncT k_wf(wf.begin() + kpoint.begin, wf.begin() + kpoint.end);

        vecfuncT k_vwf(vwf.begin() + kpoint.begin, vwf.begin() + kpoint.end);

        // Build fock matrix

        tensorT fock = build_fock_matrix(k_wf, k_vwf, kpoint);

        tensorT overlap = matrix_inner(_world, k_wf, k_wf, true);


//        // Do right hand side stuff for kpoint

//        bool isgamma = (is_equal(k0,0.0,1e-5) &&

//                        is_equal(k1,0.0,1e-5) &&

//                        is_equal(k2,0.0,1e-5));

//        if (_params.periodic && !isgamma) // Non-zero k-point

//        {

//          // Do the gradient term and k^2/2

//          vecfuncT d_wf = zero_functions<valueT,NDIM>(_world, k_wf.size());

//          complex_derivative_3d Dx(_world,0);

//          complex_derivative_3d Dy(_world,1);

//          complex_derivative_3d Dz(_world,2);

//          for (unsigned int i = 0; i < k_wf.size(); i++)

//          {

//            // gradient

//            functionT dx_wf = Dx(k_wf[i]);

//            functionT dy_wf = Dy(k_wf[i]);

//            functionT dz_wf = Dz(k_wf[i]);

//            d_wf[i] = std::complex<T>(0.0,k0)*dx_wf +

//                      std::complex<T>(0.0,k1)*dy_wf +

//                      std::complex<T>(0.0,k2)*dz_wf;

//            // k^/2

//            double ksq = k0*k0 + k1*k1 + k2*k2;

//            k_vwf[i] += 0.5 * ksq * k_wf[i];

//            k_vwf[i] -= d_wf[i];

//          }

//        }


        if (_params.canon) // canonical orbitals

        {

          ctensorT U; rtensorT e;

          sygv(fock, overlap, 1, U, e);


          unsigned int nmo = k_wf.size();

          // Fix phases.

          long imax;

          for (long j = 0; j < nmo; j++)

          {

              // Get index of largest value in column

              U(_,j).absmax(&imax);

              T ang = arg(U(imax,j));

              std::complex<T> phase = exp(std::complex<T>(0.0,-ang));

              // Loop through the rest of the column and divide by the phase

              for (long i = 0; i < nmo; i++)

              {

                U(i,j) *= phase;

              }

          }


          // Within blocks with the same occupation number attempt to

          // keep orbitals in the same order (to avoid confusing the

          // non-linear solver).  Have to run the reordering multiple

          // times to handle multiple degeneracies.

          int maxpass = 5;

          for (int pass = 0; pass < maxpass; pass++)

          {

              long j;

              for (long i = 0; i < nmo; i++)

              {

                U(_, i).absmax(&j);

                if (i != j)

                {

                  tensorT tmp = copy(U(_, i));

                  U(_, i) = U(_, j);

                  U(_, j) = tmp;

                  //swap(e[i], e[j]);

                  T ti = e[i];

                  T tj = e[j];

                  e[i] = tj; e[j] = ti;

                }

              }

          }


          // Rotations between effectively degenerate states confound

          // the non-linear equation solver ... undo these rotations

          long ilo = 0; // first element of cluster

          while (ilo < nmo-1) {

              long ihi = ilo;

              while (fabs(real(e[ilo]-e[ihi+1])) < thresh*10.0*max(fabs(real(e[ilo])),1.0)) {

                  ihi++;

                  if (ihi == nmo-1) break;

              }

              long nclus = ihi - ilo + 1;

              if (nclus > 1) {

                  if (_world.rank() == 0) print("   found cluster", ilo, ihi);

                  tensorT q = copy(U(Slice(ilo,ihi),Slice(ilo,ihi)));

                  //print(q);

                  // Special code just for nclus=2

                  // double c = 0.5*(q(0,0) + q(1,1));

                  // double s = 0.5*(q(0,1) - q(1,0));

                  // double r = sqrt(c*c + s*s);

                  // c /= r;

                  // s /= r;

                  // q(0,0) = q(1,1) = c;

                  // q(0,1) = -s;

                  // q(1,0) = s;


                  // Iteratively construct unitary rotation by

                  // exponentiating the antisymmetric part of the matrix

                  // ... is quadratically convergent so just do 3

                  // iterations

                  ctensorT rot = matrix_exponential(-0.5*(q - conj_transpose(q)));

                  q = inner(q,rot);

                  ctensorT rot2 = matrix_exponential(-0.5*(q - conj_transpose(q)));

                  q = inner(q,rot2);

                  ctensorT rot3 = matrix_exponential(-0.5*(q - conj_transpose(q)));

                  q = inner(rot,inner(rot2,rot3));

                  U(_,Slice(ilo,ihi)) = inner(U(_,Slice(ilo,ihi)),q);

              }

              ilo = ihi+1;

          }


          // Debug output

          if (_params.print_matrices && _world.rank() == 0)

          {

              printf("(%10.5f, %10.5f, %10.5f)\n", k0, k1, k2);

              print("Overlap matrix:");

              print(overlap);


              print("Fock matrix:");

              print(fock);


              print("U matrix: (eigenvectors)");

              print(U);


              print("Fock matrix eigenvalues:");

              print(e);

          }


          // WSTHORNTON

          //print_fock_matrix_eigs(k_wf, k_vwf, kpoint);


          // transform orbitals and V * (orbitals)

          //k_vwf = transform(_world, k_vwf, U, 1e-5 / std::min(30.0, double(k_wf.size())), false);

          //k_wf = transform(_world, k_wf, U, FunctionDefaults<3>::get_thresh() / std::min(30.0, double(k_wf.size())), true);


          // WSTHORNTON

          //print_fock_matrix_eigs(k_wf, k_vwf, kpoint);


          // Do right hand side stuff for kpoint

          bool isgamma = (is_equal(k0,0.0,1e-5) &&

                          is_equal(k1,0.0,1e-5) &&

                          is_equal(k2,0.0,1e-5));

          if (_params.periodic && !isgamma) // Non-zero k-point

          {

            // Do the gradient term and k^2/2

            vecfuncT d_wf = zero_functions_compressed<valueT,NDIM>(_world, k_wf.size());

            complex_derivative_3d Dx(_world,0);

            complex_derivative_3d Dy(_world,1);

            complex_derivative_3d Dz(_world,2);

            for (unsigned int i = 0; i < k_wf.size(); i++)

            {

              // gradient

              functionT dx_wf = Dx(k_wf[i]);

              functionT dy_wf = Dy(k_wf[i]);

              functionT dz_wf = Dz(k_wf[i]);

              d_wf[i] = std::complex<T>(0.0,k0)*dx_wf +

                        std::complex<T>(0.0,k1)*dy_wf +

                        std::complex<T>(0.0,k2)*dz_wf;

              // k^/2

              double ksq = k0*k0 + k1*k1 + k2*k2;

              k_vwf[i] += 0.5 * ksq * k_wf[i];

              k_vwf[i] -= d_wf[i];

            }

          }


          // WSTHORNTON (new code)

          unsigned int eimax = -1;

          double eimaxval = -1e10;

          for (unsigned int ei = kpoint.begin, fi = 0; ei < kpoint.end;

            ei++, fi++)

          {

            if ((real(e(fi,fi)) > 0.0) && (real(e(fi,fi)) > eimaxval))

            {

              eimax = fi;

              eimaxval = real(e(fi,fi));

            }

          }


          double eshift = (eimaxval > 0.0) ? eimaxval + 0.1 : 0.0;

          for (unsigned int ei = kpoint.begin, fi = 0; ei < kpoint.end;

            ei++, fi++)

          {

            // Save the latest eigenvalues

            eigs[ei] = real(e(fi,fi));

            alpha[ei] = e(fi,fi)-eshift;

            k_vwf[fi] += (alpha[ei]-eigs[ei])*k_wf[fi];

          }


          if (_world.rank() == 0)

          {

            _eigF << "kpt: " << kp << endl;

            _eigF << setfill('-') << setw(20) << " " << endl;

            for (unsigned int ei = kpoint.begin; ei < kpoint.end; ei++)

            {

              char eigstr[50];

              printf("%3d%15.10f",ei,real(eigs[ei]));

//              _eigF << ei << setfill(' ') << setw(12) << real(eigs[ei]) << endl;

              _eigF << eigstr << endl;

            }

            _eigF << "\n\n" << endl;

          }

        }

        else // non-canonical orbitals

        {

          // diagonlize just to print eigenvalues

          tensorT overlap = matrix_inner(_world, k_wf, k_wf, true);

          ctensorT c; rtensorT e;

          sygv(fock, overlap, 1, c, e);

          for (unsigned int ei = 0; ei < e.dim(0); ei++)

          {

            double diffe = (ei == 0) ? 0.0 : real(e(ei,ei))-real(e(ei-1,ei-1));

            if (_world.rank() == 0)

              print("kpoint ", kp, "ei ", ei, "eps ", real(e(ei,ei)), "\tdiff\t", diffe);

          }


          for (unsigned int ei = kpoint.begin, fi = 0;

            ei < kpoint.end; ei++, fi++)

          {

            alpha[ei] = std::min(-0.1, real(fock(fi,fi)));

            fock(fi,fi) -= std::complex<T>(alpha[ei], 0.0);

          }


          std::vector<functionT> fwf = transform(_world, k_wf, fock, trantol);

          gaxpy(_world, 1.0, k_vwf, -1.0, fwf);

          fwf.clear();

        }

        for (unsigned int wi = kpoint.begin, fi = 0; wi < kpoint.end;

          wi++, fi++)

        {

          wf[wi] = k_wf[fi];

          vwf[wi] = k_vwf[fi];

        }

      }

    }


    //*************************************************************************


    //*************************************************************************


    void do_rhs_simple(vecfuncT& wf,

                vecfuncT& vwf,

                std::vector<KPoint> kpoints,

                std::vector<T>& alpha,

                std::vector<double>& eigs)

    {

      // tolerance

      double trantol = 0.1*_params.thresh/std::min(30.0,double(wf.size()));

      double thresh = 1e-4;


      if (_world.rank() == 0) _eigF << "Iteration: " << _it << endl;

      for (unsigned int kp = 0; kp < kpoints.size(); kp++)

      {

        // Get k-point and orbitals for this k-point

        KPoint kpoint = kpoints[kp];

        double k0 = kpoint.k[0];

        double k1 = kpoint.k[1];

        double k2 = kpoint.k[2];

        // Extract the relevant portion of the list of orbitals and the list of the

        // V times the orbitals

        vecfuncT k_wf(wf.begin() + kpoint.begin, wf.begin() + kpoint.end);

        vecfuncT k_vwf(vwf.begin() + kpoint.begin, vwf.begin() + kpoint.end);


        // Build fock matrix

        tensorT fock = build_fock_matrix(k_wf, k_vwf, kpoint);

        tensorT overlap = matrix_inner(_world, k_wf, k_wf, true);

        for (unsigned int i = 0; i < k_wf.size(); i++)

          fock(i,i) += std::complex<double>(i*_params.thresh*0.1,0.0);


        ctensorT U; rtensorT e;

        sygv(fock, overlap, 1, U, e);


        if (_params.print_matrices && _world.rank() == 0)

        {

            printf("(%10.5f, %10.5f, %10.5f)\n", k0, k1, k2);

            print("Overlap matrix:");

            print(overlap);


            print("Fock matrix:");

            print(fock);


            print("U matrix: (eigenvectors)");

            print(U);


            print("Fock matrix eigenvalues:");

            print(e);

        }


        // this is all of the B.S. for the solver

        if (_params.solver == 1)

        {

          unsigned int nmo = k_wf.size();

          // Fix phases.

          long imax;

          for (long j = 0; j < nmo; j++)

          {

              // Get index of largest value in column

              U(_,j).absmax(&imax);

              T ang = arg(U(imax,j));

              std::complex<T> phase = exp(std::complex<T>(0.0,-ang));

              // Loop through the rest of the column and divide by the phase

              for (long i = 0; i < nmo; i++)

              {

                U(i,j) *= phase;

              }

          }


          // Within blocks with the same occupation number attempt to

          // keep orbitals in the same order (to avoid confusing the

          // non-linear solver).  Have to run the reordering multiple

          // times to handle multiple degeneracies.

          int maxpass = 5;

          for (int pass = 0; pass < maxpass; pass++)

          {

              long j;

              for (long i = 0; i < nmo; i++)

              {

                U(_, i).absmax(&j);

                if (i != j)

                {

                  tensorT tmp = copy(U(_, i));

                  U(_, i) = U(_, j);

                  U(_, j) = tmp;

                  //swap(e[i], e[j]);

                  T ti = e[i];

                  T tj = e[j];

                  e[i] = tj; e[j] = ti;

                }

              }

          }


          // Rotations between effectively degenerate states confound

          // the non-linear equation solver ... undo these rotations

          long ilo = 0; // first element of cluster

          while (ilo < nmo-1) {

              long ihi = ilo;

              while (fabs(real(e[ilo]-e[ihi+1])) < thresh*10.0*max(fabs(real(e[ilo])),1.0)) {

                  ihi++;

                  if (ihi == nmo-1) break;

              }

              long nclus = ihi - ilo + 1;

              if (nclus > 1) {

                  if (_world.rank() == 0) print("   found cluster", ilo, ihi);

                  tensorT q = copy(U(Slice(ilo,ihi),Slice(ilo,ihi)));

                  //print(q);

                  // Special code just for nclus=2

                  // double c = 0.5*(q(0,0) + q(1,1));

                  // double s = 0.5*(q(0,1) - q(1,0));

                  // double r = sqrt(c*c + s*s);

                  // c /= r;

                  // s /= r;

                  // q(0,0) = q(1,1) = c;

                  // q(0,1) = -s;

                  // q(1,0) = s;


                  // Iteratively construct unitary rotation by

                  // exponentiating the antisymmetric part of the matrix

                  // ... is quadratically convergent so just do 3

                  // iterations

                  ctensorT rot = matrix_exponential(-0.5*(q - conj_transpose(q)));

                  q = inner(q,rot);

                  ctensorT rot2 = matrix_exponential(-0.5*(q - conj_transpose(q)));

                  q = inner(q,rot2);

                  ctensorT rot3 = matrix_exponential(-0.5*(q - conj_transpose(q)));

                  q = inner(rot,inner(rot2,rot3));

                  U(_,Slice(ilo,ihi)) = inner(U(_,Slice(ilo,ihi)),q);

              }

              ilo = ihi+1;

          }

        }


        // transform orbitals and V * (orbitals)

        k_vwf = transform(_world, k_vwf, U, 1e-5 / std::min(30.0, double(k_wf.size())), false);

        k_wf = transform(_world, k_wf, U, FunctionDefaults<3>::get_thresh() / std::min(30.0, double(k_wf.size())), true);


        // Do right hand side stuff for kpoint

        bool isgamma = (is_equal(k0,0.0,1e-5) &&

                        is_equal(k1,0.0,1e-5) &&

                        is_equal(k2,0.0,1e-5));

        if (_params.periodic && !isgamma) // Non-zero k-point

        {

          // Do the gradient term and k^2/2

          vecfuncT d_wf = zero_functions_compressed<valueT,NDIM>(_world, k_wf.size());

          complex_derivative_3d Dx(_world,0);

          complex_derivative_3d Dy(_world,1);

          complex_derivative_3d Dz(_world,2);

          for (unsigned int i = 0; i < k_wf.size(); i++)

          {

            // gradient

            functionT dx_wf = Dx(k_wf[i]);

            functionT dy_wf = Dy(k_wf[i]);

            functionT dz_wf = Dz(k_wf[i]);


            // WSTHORNTON

//            double delxx = std::abs(inner(k_wf[i],Dx(Dx(k_wf[i]))));

//            double delyy = std::abs(inner(k_wf[i],Dy(Dy(k_wf[i]))));

//            double delzz = std::abs(inner(k_wf[i],Dz(Dz(k_wf[i]))));


//            if (_world.rank() == 0)

//              printf("orb %2.2d  delxx:  %15.8e  delyy:  %15.8e  delzz:  %15.8e\n",i, delxx, delyy, delzz);


            // WSTHORNTON

//            std::vector<long> npt(3,101);

//            char fnamedx[50];

//            sprintf(fnamedx, "xorb%2.2d__.dx",i);

//            plotdx(k_wf[i], fnamedx, FunctionDefaults<3>::get_cell(), npt);

//

//            char fnamedx_dx[50];

//            sprintf(fnamedx_dx, "xorb%2.2d__dx.dx",i);

//            plotdx(dx_wf, fnamedx_dx, FunctionDefaults<3>::get_cell(), npt);

//            char fnamedx_dy[50];

//            sprintf(fnamedx_dy, "xorb%2.2d__dy.dx",i);

//            plotdx(dy_wf, fnamedx_dy, FunctionDefaults<3>::get_cell(), npt);

//            char fnamedx_dz[50];

//            sprintf(fnamedx_dz, "xorb%2.2d__dz.dx",i);

//            plotdx(dz_wf, fnamedx_dz, FunctionDefaults<3>::get_cell(), npt);

//

//            rfunctionT xfunc = rfactoryT(_world).functor(

//              rfunctorT(new DipoleFunctor(0))).

//                thresh(_params.thresh).truncate_on_project();

//            rfunctionT yfunc = rfactoryT(_world).functor(

//              rfunctorT(new DipoleFunctor(1))).

//                thresh(_params.thresh).truncate_on_project();

//            rfunctionT zfunc = rfactoryT(_world).functor(

//              rfunctorT(new DipoleFunctor(2))).

//                thresh(_params.thresh).truncate_on_project();

//

//            double xdip = std::abs(inner(k_wf[i],xfunc*k_wf[i]));

//            double ydip = std::abs(inner(k_wf[i],yfunc*k_wf[i]));

//            double zdip = std::abs(inner(k_wf[i],zfunc*k_wf[i]));

//

//            if (_world.rank() == 0)

//              printf("orb: %1d     dipole moment: (%7.5e,%7.5e,%7.5e)\n",i,xdip,ydip,zdip);

//

//            double xdip1 = std::real(inner(k_wf[i],xfunc*k_wf[i]));

//            double ydip1 = std::real(inner(k_wf[i],yfunc*k_wf[i]));

//            double zdip1 = std::real(inner(k_wf[i],zfunc*k_wf[i]));

//

//            if (_world.rank() == 0)

//              printf("orb: %1d     dipole moment: (%7.5e,%7.5e,%7.5e)\n",i,xdip1,ydip1,zdip1);

//

//            double xdip2 = std::imag(inner(k_wf[i],xfunc*k_wf[i]));

//            double ydip2 = std::imag(inner(k_wf[i],yfunc*k_wf[i]));

//            double zdip2 = std::imag(inner(k_wf[i],zfunc*k_wf[i]));

//

//            if (_world.rank() == 0)

//              printf("orb: %1d     dipole moment: (%7.5e,%7.5e,%7.5e)\n\n\n",i,xdip2,ydip2,zdip2);

//

//            // WSTHORNTON

//            char fname_x[50];

//            char fname_y[50];

//            char fname_z[50];

//

//            char fnamex_x[50];

//            char fnamex_y[50];

//            char fnamex_z[50];

//

//            char fnamey_x[50];

//            char fnamey_y[50];

//            char fnamey_z[50];

//

//            char fnamez_x[50];

//            char fnamez_y[50];

//            char fnamez_z[50];

//

//            sprintf(fname_x, "orb%2.2d__x.dat",i);

//            sprintf(fname_y, "orb%2.2d__y.dat",i);

//            sprintf(fname_z, "orb%2.2d__z.dat",i);

//

//            sprintf(fnamex_x, "orb%2.2d_dx_x.dat",i);

//            sprintf(fnamex_y, "orb%2.2d_dx_y.dat",i);

//            sprintf(fnamex_z, "orb%2.2d_dx_z.dat",i);

//

//            sprintf(fnamey_x, "orb%2.2d_dy_x.dat",i);

//            sprintf(fnamey_y, "orb%2.2d_dy_y.dat",i);

//            sprintf(fnamey_z, "orb%2.2d_dy_z.dat",i);

//

//            sprintf(fnamez_x, "orb%2.2d_dz_x.dat",i);

//            sprintf(fnamez_y, "orb%2.2d_dz_y.dat",i);

//            sprintf(fnamez_z, "orb%2.2d_dz_z.dat",i);

//

//            coord_3d pt1x {-_params.L/2,0.0,0.0};

//            coord_3d pt2x { _params.L/2,0.0,0.0};

//

//            coord_3d pt1y {0.0,-_params.L/2,0.0};

//            coord_3d pt2y {0.0, _params.L/2,0.0};

//

//            coord_3d pt1z {0.0,0.0,-_params.L/2};

//            coord_3d pt2z {0.0,0.0, _params.L/2};

//

//            plot_line(fname_x,30000,pt1x,pt2x,k_wf[i]);

//            plot_line(fname_y,30000,pt1y,pt2y,k_wf[i]);

//            plot_line(fname_z,30000,pt1z,pt2z,k_wf[i]);

//

//            plot_line(fnamex_x,30000,pt1x,pt2x,dx_wf);

//            plot_line(fnamex_y,30000,pt1y,pt2y,dx_wf);

//            plot_line(fnamex_z,30000,pt1z,pt2z,dx_wf);

//

//            plot_line(fnamey_x,30000,pt1x,pt2x,dy_wf);

//            plot_line(fnamey_y,30000,pt1y,pt2y,dy_wf);

//            plot_line(fnamey_z,30000,pt1z,pt2z,dy_wf);

//

//            plot_line(fnamez_x,30000,pt1x,pt2x,dz_wf);

//            plot_line(fnamez_y,30000,pt1y,pt2y,dz_wf);

//            plot_line(fnamez_z,30000,pt1z,pt2z,dz_wf);


            d_wf[i] = std::complex<T>(0.0,k0)*dx_wf +

                      std::complex<T>(0.0,k1)*dy_wf +

                      std::complex<T>(0.0,k2)*dz_wf;

            // k^/2

            double ksq = k0*k0 + k1*k1 + k2*k2;

            k_vwf[i] += 0.5 * ksq * k_wf[i];

            k_vwf[i] -= d_wf[i];

          }

        }


        // WSTHORNTON (new code)

        unsigned int eimax = -1;

        double eimaxval = -1e10;

        for (unsigned int ei = kpoint.begin, fi = 0; ei < kpoint.end;

          ei++, fi++)

        {

          if ((real(e(fi,fi)) > 0.0) && (real(e(fi,fi)) > eimaxval))

          {

            eimax = fi;

            eimaxval = real(e(fi,fi));

          }

        }


        double eshift = (eimaxval > 0.0) ? eimaxval + 0.1 : 0.0;

        for (unsigned int ei = kpoint.begin, fi = 0; ei < kpoint.end;

          ei++, fi++)

        {

          // Save the latest eigenvalues

          eigs[ei] = real(e(fi,fi));

          alpha[ei] = e(fi,fi)-eshift;

          k_vwf[fi] += (alpha[ei]-eigs[ei])*k_wf[fi];

        }


//        if (_world.rank() == 0) printf("do_rhs_simple: (3) ...\n\n");

//        print_fock_matrix_eigs(k_wf, k_vwf, kpoint_gamma);


        if (_world.rank() == 0)

        {

          _eigF << "kpt: " << kp << endl;

          _eigF << setfill('-') << setw(20) << " " << endl;

          for (unsigned int ei = kpoint.begin; ei < kpoint.end; ei++)

          {

            char eigstr[50];

            sprintf(eigstr,"%3d%15.10f",ei,real(eigs[ei]));

            _eigF << eigstr << endl;

          }

          _eigF << "\n\n" << endl;

        }

        for (unsigned int wi = kpoint.begin, fi = 0; wi < kpoint.end;

          wi++, fi++)

        {

          wf[wi] = k_wf[fi];

          vwf[wi] = k_vwf[fi];

        }

      }

    }


    //*************************************************************************


    //*************************************************************************


    tensor_complex make_kinetic_matrix(World& world, const vector_complex_function_3d& v, const KPoint& k) {

        const double_complex I = double_complex(0.0,1.0);

        double kx = k.k[0];

        double ky = k.k[1];

        double kz = k.k[2];


        complex_derivative_3d Dx(world, 0);

        complex_derivative_3d Dy(world, 1);

        complex_derivative_3d Dz(world, 2);


        vector_complex_function_3d dvx = apply(world, Dx, v);

        vector_complex_function_3d dvy = apply(world, Dy, v);

        vector_complex_function_3d dvz = apply(world, Dz, v);


        // -1/2 (del + ik)^2 = -1/2 del^2 - i k.del + 1/2 k^2

        // -1/2 <p|del^2|q> = +1/2 <del p | del q>


        tensor_complex f1 = 0.5 * (matrix_inner(world, dvx, dvx, true) +

                                   matrix_inner(world, dvy, dvy, true) +

                                   matrix_inner(world, dvz, dvz, true));


        tensor_complex f2 =

            (-I*kx)*matrix_inner(world, v, dvx, false) +

            (-I*ky)*matrix_inner(world, v, dvy, false) +

            (-I*kz)*matrix_inner(world, v, dvz, false);


        tensor_complex f3 = (0.5 * (kx*kx + ky*ky + kz*kz)) * matrix_inner(world, v, v, true);


        return f1 + f2 + f3;

    }


    //*************************************************************************


    //*************************************************************************


    tensorT build_fock_matrix(vecfuncT& psi,

                              vecfuncT& vpsi,

                              KPoint kpoint)

    {

      // Build the potential matrix

      START_TIMER(_world);

      tensorT potential = matrix_inner(_world, psi, vpsi, true);

      _world.gop.fence();

      END_TIMER(_world,"potential energy matrix");

      if (_world.rank()==0) printf("\n");


      START_TIMER(_world);

      if (_world.rank() == 0) _outputF << "Building kinetic energy matrix ...\n\n" << endl;

        tensorT kinetic = ::kinetic_energy_matrix<T,NDIM>(_world, psi,

                                                  _params.periodic,

                                                  kpoint);

      tensorT kinetic2 = make_kinetic_matrix(_world, psi, kpoint);

      _world.gop.fence();

      END_TIMER(_world,"kinetic energy matrix");

      if (_world.rank() == 0) printf("\n");


      if (_world.rank() == 0) _outputF << "Constructing Fock matrix ...\n\n" << endl;

      tensorT fock = potential + kinetic;

      fock = 0.5 * (fock + conj_transpose(fock));

      _world.gop.fence();


      if (_world.rank() == 0)

      {

        print("KINETIC:");

        print(kinetic);

        print("KINETIC2:");

        print(kinetic2);

        print("POTENTIAL:");

        print(potential);

        print("FOCK:");

        print(fock);

      }


      return fock;

    }


    //*************************************************************************


    //*************************************************************************


    void gram_schmidt(vecfuncT& f, KPoint kpoint)

    {

      for (unsigned int fi = kpoint.begin; fi < kpoint.end; ++fi)

      {

        // Project out the lower states

        for (unsigned int fj = kpoint.begin; fj < fi; ++fj)

        {

          valueT overlap = inner(f[fj], f[fi]);

          f[fi] -= overlap*f[fj];

        }

        f[fi].scale(1.0/f[fi].norm2());

      }

    }


    //*************************************************************************


    //*************************************************************************

    /// Given overlap matrix, return rotation with 3rd order error to orthonormalize the vectors


    tensorT Q3(const tensorT& s) {

        tensorT Q = inner(s,s);

        Q.gaxpy(0.2,s,-2.0/3.0);

        for (int i=0; i<s.dim(0); ++i) Q(i,i) += 1.0;

        return Q.scale(15.0/8.0);

    }


    //*************************************************************************


    //*************************************************************************

    /// Computes matrix square root (not used any more?)


    ctensorT csqrt(const ctensorT& s, double tol=1e-8) {

        int n=s.dim(0), m=s.dim(1);

        MADNESS_ASSERT(n==m);

        ctensorT c; rtensorT e;

        //s.gaxpy(0.5,conj_transpose(s),0.5); // Ensure exact symmetry

        syev(s, c, e);

        for (int i=0; i<n; ++i) {

            if (e(i) < -tol) {

                MADNESS_EXCEPTION("Matrix square root: negative eigenvalue",i);

            }

            else if (e(i) < tol) { // Ugh ..

                print("Matrix square root: Warning: small eigenvalue ", i, e(i));

                e(i) = tol;

            }

            e(i) = 1.0/sqrt(e(i));

        }

        for (int j=0; j<n; ++j) {

            for (int i=0; i<n; ++i) {

                c(j,i) *= e(i);

            }

        }

        return c;

    }


    //*************************************************************************


    //*************************************************************************


    void orthonormalize(vecfuncT& wf, KPoint kpoint)

    {

      // extract k-point orbitals

      vecfuncT k_wf(wf.begin() + kpoint.begin, wf.begin() + kpoint.end);

      ctensorT S = matrix_inner(_world,k_wf,k_wf,true);

      printf("orthonormalize: \n");

      printf("before matrix (after): \n");

      print(S);

      ctensorT U = csqrt(S);

      k_wf = transform(_world, k_wf, U, _params.thresh, true);


      ctensorT S2 = matrix_inner(_world,k_wf,k_wf,true);

      printf("overlap matrix (after): \n");

      print(S2);

      for (unsigned int wi = kpoint.begin, fi = 0; wi < kpoint.end;

        wi++, fi++)

      {

        wf[wi] = k_wf[fi];

      }

    }


    //*************************************************************************


    //*************************************************************************


    vecfuncT compute_residual(const vecfuncT& awfs,

                              const vecfuncT& bwfs)

    {

      // vector of residual functions

      vecfuncT rm = sub(_world, _phisa, awfs);

      // if spin-polarized insert beta spin-orbital residual functions

      if (_params.spinpol)

      {

        vecfuncT br = sub(_world, _phisb, bwfs);

        rm.insert(rm.end(), br.begin(), br.end());

      }

      // scalar residual

      std::vector<double> rnvec = norm2s<valueT,NDIM>(_world, rm);

      double rnorm = 0.0;

      for (unsigned int i = 0; i < rnvec.size(); i++) rnorm += rnvec[i];

      // renormalize and print

      _residual = rnorm / rnvec.size();

      if (_world.rank() == 0) _outputF << "\nResiduals\n---------" << endl;

      if (_world.rank() == 0) _outputF << std::setiosflags(std::ios::scientific) << "residual = " << _residual << endl;

      if (_world.rank() == 0)

      {

        _outputF << endl;

        for (unsigned int i = 0; i < rnvec.size(); i++)

        {

          _outputF << "residual" << i << "\t" << rnvec[i] << endl;

        }

        _outputF << endl;

      }


      return rm;

    }


    //*************************************************************************


    void update_orbitals(vecfuncT& awfs,

                         vecfuncT& bwfs,

                         std::vector<KPoint> kpoints)

    {

      // truncate before we do anyting

      truncate<valueT,NDIM> (_world, awfs);

      truncate<valueT,NDIM> (_world, _phisa);

      if (_params.spinpol)

      {

        truncate<valueT,NDIM> (_world, bwfs);

        truncate<valueT,NDIM> (_world, _phisb);

      }

      // compute residual

      vecfuncT rm = compute_residual(awfs, bwfs);

      if (_params.solver > 0 && _params.maxsub > 1)

      {

        // nonlinear solver

        _subspace->update_subspace(awfs, bwfs, _phisa, _phisb, rm);

      }


      // do step restriction

      step_restriction(_phisa, awfs, 0);

      if (_params.spinpol)

      {

        step_restriction(_phisb, bwfs, 1);

      }

      // do gram-schmidt

      for (unsigned int kp = 0; kp < kpoints.size(); kp++)

      {

        gram_schmidt(awfs, kpoints[kp]);

//        orthonormalize(awfs, kpoints[kp]);

        if (_params.spinpol)

        {

          gram_schmidt(bwfs, kpoints[kp]);

//          orthonormalize(bwfs, kpoints[kp]);

        }

      }


      // update alpha and beta orbitals

      truncate<valueT,NDIM>(_world, awfs);

      for (unsigned int ai = 0; ai < awfs.size(); ai++) {

          _phisa[ai] = awfs[ai].scale(1.0 / awfs[ai].norm2());

      }

      if (_params.spinpol)

      {

        truncate<valueT,NDIM>(_world, bwfs);

        for (unsigned int bi = 0; bi < bwfs.size(); bi++)

        {

            _phisb[bi] = bwfs[bi].scale(1.0 / bwfs[bi].norm2());

        }

      }

      else

      {

        for (unsigned int ia = 0; ia < awfs.size(); ia++)

        {

          _phisb[ia] = _phisa[ia];

        }

      }

    }


    //*************************************************************************


    //*************************************************************************


    void step_restriction(vecfuncT& owfs,

                          vecfuncT& nwfs,

                          int aorb)

    {

      double s = (_it < 4) ? 0.75 : _params.sd;

      if (_world.rank() == 0) print("damping factor: ", s);

      for (unsigned int i = 0; i < owfs.size(); i++)

          nwfs[i].gaxpy(1.0 - s, owfs[i], s, false);

//      std::vector<double> rnorm = norm2s(_world, sub(_world, owfs, nwfs));

//      // Step restriction

//      int nres = 0;

//      for (unsigned int i = 0; i < owfs.size(); i++)

//      {

//        if (rnorm[i] > _params.maxrotn)

//        {

//          double s = _params.maxrotn / rnorm[i];

//          nres++;

//          if (_world.rank() == 0)

//          {

//            if (!aorb && nres == 1) _outputF << "  restricting step for alpha orbitals:" << endl;

//            if (aorb && nres == 1) _outputF << "  restricting step for beta orbitals:" << endl;

//            _outputF << i;

//          }

//          nwfs[i].gaxpy(s, owfs[i], 1.0 - s, false);

//        }

//      }

//      if (nres > 0 && _world.rank() == 0) printf("\n");

//      _world.gop.fence();

    }


    //*************************************************************************


    //*************************************************************************


    void fix_occupations(const std::vector<T>& eps,

                         std::vector<double>& occs)

    {

      // Find max/min eigenvalues

      double emax = eps[0];

      double emin = emax;

      for (int i = 0; i < eps.size(); i++)

      {

        emax = (eps[i] > emax) ? eps[i] : emax;

        emin = (eps[i] < emin) ? eps[i] : emin;

      }


      int maxits = 1000;

      // This is hardcoded to 2.0 (non-spinpolarized case) for now.

      double occmax = 2.0;

      // Fermi energy

      double efermi = 0.0;

      // Use bisection method to find the fermi energy and update occupation numbers

      bool bstop = false;

      // Some smoothing parameter

      double t1 = 1.0/_params.swidth;

      for (int it = 0; (it < maxits)&&(!bstop); it++)

      {

        // Proposed fermi energy

        efermi = 0.5 * (emax + emin);

        // Accumulated charge

        double charge = 0.0;

        // Loop over all eigenvalues and count the charge

        for (int i = 0; i < eps.size(); i++)

        {

          double x = (efermi-eps[i]) * t1;

          // need to add some smearing function here

          occs[i] = occmax*stheta_fd(x);

          charge += _kpoints[i].weight() * occs[i];

        }

        if (fabs(emax-emin) < 1e-5)

          bstop = true;

        else if (charge < _params.ncharge)

          emin = efermi;

        else

          emax = efermi;

      }

    }


    //*************************************************************************


//    //*************************************************************************

//    void update_eigenvalues(const vecfuncT& wavefs,

//        const vecfuncT& pfuncs, const vecfuncT& phis,

//        std::vector<T>& eigs)

//    {

//      // Update e

//      if (_world.rank() == 0) printf("Updating e ...\n\n");

//      for (unsigned int ei = 0; ei < eigs.size(); ei++)

//      {

//        functionT r = wavefs[ei] - phis[ei];

//        double tnorm = wavefs[ei].norm2();

//        // Compute correction to the eigenvalues

//        T ecorrection = -0.5*real(inner(pfuncs[ei], r)) / (tnorm*tnorm);

//        T eps_old = eigs[ei];

//        T eps_new = eps_old + ecorrection;

////        if (_world.rank() == 0) printf("ecorrection = %.8f\n\n", ecorrection);

////        if (_world.rank() == 0) printf("eps_old = %.8f eps_new = %.8f\n\n", eps_old, eps_new);

//        // Sometimes eps_new can go positive, THIS WILL CAUSE THE ALGORITHM TO CRASH. So,

//        // I bounce the new eigenvalue back into the negative side of the real axis. I

//        // keep doing this until it's good or I've already done it 10 times.

//        int counter = 50;

//        while (eps_new >= 0.0 && counter < 20)

//        {

//          // Split the difference between the new and old estimates of the

//          // pi-th eigenvalue.

//          eps_new = eps_old + 0.5 * (eps_new - eps_old);

//          counter++;

//        }

//        // Still no go, forget about it. (1$ to Donnie Brasco)

//        if (eps_new >= 0.0)

//        {

//          if (_world.rank() == 0) printf("FAILURE OF WST: exiting!!\n\n");

//          _exit(0);

//        }

//        // Set new eigenvalue

//        eigs[ei] = eps_new;

//      }

//    }

//    //*************************************************************************


//    //*************************************************************************

//    double get_eig(int indx)

//    {

//      return _solver->get_eig(indx);

//    }

//    //*************************************************************************

//

//    //*************************************************************************

//    functionT get_phi(int indx)

//    {

//      return _solver->get_phi(indx);

//    }

//    //*************************************************************************

//

//    //*************************************************************************

//    const std::vector<double>& eigs()

//    {

//      return _solver->eigs();

//    }

//    //*************************************************************************

//

//    //*************************************************************************

//    const vecfuncT& phis()

//    {

//      return _solver->phis();

//    }

//    //*************************************************************************


  };


  //***************************************************************************


}

#define SOLVER_H_


#endif /* SOLVER_H_ */

potential
double potential(const coord_3d &r)
Definition 3dharmonic.cc:132

q
double q(double t)
Definition DKops.h:18

MADworld.h
This header should include pretty much everything needed for the parallel runtime.

double_complex
std::complex< double > double_complex
Definition cfft.h:14

A
Definition test_ar.cc:118

B
Definition test_ar.cc:141

MolecularEntity
Definition mentity.h:95

MolecularEntity::read_file
void read_file(const std::string &filename, bool fractional)
Definition mentity.cc:289

MolecularEntity::natom
int natom() const
Definition mentity.h:112

MolecularEntity::total_nuclear_charge
double total_nuclear_charge() const
Definition mentity.cc:444

MolecularEntity::center
void center()
Moves the center of nuclear charge to the origin.
Definition mentity.cc:413

MolecularEntity::get_atom
const Atom & get_atom(unsigned int i) const
Definition mentity.cc:369

MolecularNuclearChargeDensityFunctor
Definition electronicstructureapp.h:85

madness::Atom
Definition molecule.h:60

madness::Atom::y
double y
Definition molecule.h:62

madness::Atom::x
double x
Definition molecule.h:62

madness::Atom::z
double z
Definition molecule.h:62

madness::AtomicBasisFunction
Used to represent one basis function from a shell on a specific center.
Definition madness/chem/molecularbasis.h:409

madness::AtomicBasisFunction::get_coords
void get_coords(double &x, double &y, double &z) const
Definition madness/chem/molecularbasis.h:454

madness::AtomicBasisSet
Contracted Gaussian basis.
Definition madness/chem/molecularbasis.h:469

madness::AtomicBasisSet::eval_guess_density
double eval_guess_density(const Molecule &molecule, double x, double y, double z) const
Evaluates the guess density.
Definition madness/chem/molecularbasis.h:646

madness::AtomicBasisSet::get_atomic_basis_function
AtomicBasisFunction get_atomic_basis_function(const Molecule &molecule, size_t ibf) const
Returns the ibf'th atomic basis function.
Definition madness/chem/molecularbasis.h:600

madness::AtomicBasisSet::read_file
void read_file(std::string filename)
read the atomic basis set from file
Definition molecularbasis.cc:119

madness::AtomicBasisSet::nbf
int nbf(const Molecule &molecule) const
Given a molecule count the number of basis functions.
Definition madness/chem/molecularbasis.h:624

madness::BaseTensor::dim
long dim(int i) const
Returns the size of dimension i.
Definition basetensor.h:147

madness::ComplexExp
Definition solver.h:98

madness::ComplexExp::exponent
const vec3dT exponent
Definition solver.h:103

madness::ComplexExp::coordT
Vector< double, NDIM > coordT
Definition solver.h:100

madness::ComplexExp::operator()
double_complex operator()(const coordT &x) const
You should implement this to return f(x)
Definition solver.h:108

madness::ComplexExp::ComplexExp
ComplexExp(vec3dT exponent, double_complex coeff)
Definition solver.h:105

madness::ComplexExp::vec3dT
Vector< double, NDIM > vec3dT
Definition solver.h:101

madness::ComplexExp::coeff
const double_complex coeff
Definition solver.h:102

madness::Derivative
Implements derivatives operators with variety of boundary conditions on simulation domain.
Definition derivative.h:266

madness::DipoleFunctor
A MADNESS functor to compute either x, y, or z.
Definition solver.h:165

madness::DipoleFunctor::~DipoleFunctor
virtual ~DipoleFunctor()
Definition solver.h:173

madness::DipoleFunctor::DipoleFunctor
DipoleFunctor(int axis)
Definition solver.h:169

madness::DipoleFunctor::operator()
double operator()(const coordT &x) const
Definition solver.h:170

madness::DipoleFunctor::axis
const int axis
Definition solver.h:167

madness::FunctionDefaults
FunctionDefaults holds default paramaters as static class members.
Definition funcdefaults.h:100

madness::FunctionDefaults::get_k
static int get_k()
Returns the default wavelet order.
Definition funcdefaults.h:163

madness::FunctionDefaults::set_thresh
static void set_thresh(double value)
Sets the default threshold.
Definition funcdefaults.h:183

madness::FunctionDefaults::set_k
static void set_k(int value)
Sets the default wavelet order.
Definition funcdefaults.h:170

madness::FunctionDefaults::get_thresh
static const double & get_thresh()
Returns the default threshold.
Definition funcdefaults.h:176

madness::FunctionDefaults::set_bc
static void set_bc(const BoundaryConditions< NDIM > &value)
Sets the default boundary conditions.
Definition funcdefaults.h:319

madness::FunctionDefaults::get_cell_width
static const Tensor< double > & get_cell_width()
Returns the width of each user cell dimension.
Definition funcdefaults.h:369

madness::FunctionDefaults::set_cubic_cell
static void set_cubic_cell(double lo, double hi)
Sets the user cell to be cubic with each dimension having range [lo,hi].
Definition funcdefaults.h:362

madness::FunctionDefaults::get_cell
static const Tensor< double > & get_cell()
Gets the user cell for the simulation.
Definition funcdefaults.h:347

madness::FunctionFactory
FunctionFactory implements the named-parameter idiom for Function.
Definition function_factory.h:86

madness::FunctionFunctorInterface
Abstract base class interface required for functors used as input to Functions.
Definition function_interface.h:68

madness::Function
A multiresolution adaptive numerical function.
Definition mra.h:139

madness::KPoint
Definition eigsolver.h:63

madness::KPoint::weight
double weight()
Definition eigsolver.h:78

madness::MolecularPotentialFunctor
Functor for evaluating the nuclear attraction potential of a molecule at a given point.
Definition potentialmanager.h:69

madness::SeparatedConvolution
Convolutions in separated form (including Gaussian)
Definition operator.h:139

madness::Slice
A slice defines a sub-range or patch of a dimension.
Definition slice.h:103

madness::Solver
The main class of the periodic DFT solver.
Definition solver.h:619

madness::Solver::tensorT
Tensor< valueT > tensorT
Definition solver.h:632

madness::Solver::make_lda_potential
rfunctionT make_lda_potential(World &world, const rfunctionT &arho, const rfunctionT &brho, const rfunctionT &adelrhosq, const rfunctionT &bdelrhosq)
Definition solver.h:1230

madness::Solver::genkmesh
std::vector< KPoint > genkmesh(unsigned int ngridk0, unsigned ngridk1, unsigned int ngridk2, double koffset0, double koffset1, double koffset2, double R)
Definition solver.h:890

madness::Solver::compute_residual
vecfuncT compute_residual(const vecfuncT &awfs, const vecfuncT &bwfs)
Definition solver.h:3683

madness::Solver::vecfuncT
std::vector< functionT > vecfuncT
Definition solver.h:625

madness::Solver::_it
int _it
Definition solver.h:746

madness::Solver::make_bsh_operators
std::vector< poperatorT > make_bsh_operators(const std::vector< T > &eigs)
Definition solver.h:2081

madness::Solver::apply_hf_exchange3
void apply_hf_exchange3(vecfuncT &phisa, vecfuncT &phisb, vecfuncT &funcsa, vecfuncT &funcsb, double &xc)
Definition solver.h:2318

madness::Solver::apply_hf_exchange4
void apply_hf_exchange4(vecfuncT &phisa, vecfuncT &phisb, vecfuncT &funcsa, vecfuncT &funcsb, double &xc)
Definition solver.h:2366

madness::Solver::_world
World & _world
Definition solver.h:639

madness::Solver::do_rhs_simple
void do_rhs_simple(vecfuncT &wf, vecfuncT &vwf, std::vector< KPoint > kpoints, std::vector< T > &alpha, std::vector< double > &eigs)
Definition solver.h:3202

madness::Solver::_mentity
MolecularEntity _mentity
Definition solver.h:714

madness::Solver::init
void init(const std::string &filename)
Definition solver.h:789

madness::Solver::_aobasisf
cvecfuncT _aobasisf
Definition solver.h:750

madness::Solver::csqrt
ctensorT csqrt(const ctensorT &s, double tol=1e-8)
Computes matrix square root (not used any more?)
Definition solver.h:3634

madness::Solver::vecsubspaceT
std::vector< subspaceT > vecsubspaceT
Definition solver.h:636

madness::Solver::_phisa
vecfuncT _phisa
Definition solver.h:650

madness::Solver::functionT
Function< valueT, NDIM > functionT
Definition solver.h:624

madness::Solver::matrix_exponential
ctensorT matrix_exponential(const ctensorT &A)
Definition solver.h:2786

madness::Solver::Solver
Solver(World &world, rfunctionT vnucrhon, vecfuncT phisa, vecfuncT phisb, std::vector< T > eigsa, std::vector< T > eigsb, ElectronicStructureParams params, MolecularEntity mentity)
Definition solver.h:1289

madness::Solver::_aobasis
AtomicBasisSet _aobasis
Definition solver.h:722

madness::Solver::_nao
int _nao
Definition solver.h:754

madness::Solver::make_kinetic_matrix
tensor_complex make_kinetic_matrix(World &world, const vector_complex_function_3d &v, const KPoint &k)
Definition solver.h:3531

madness::Solver::_vnucrhon
rfunctionT _vnucrhon
Definition solver.h:646

madness::Solver::_cop
SeparatedConvolution< T, NDIM > * _cop
Definition solver.h:698

madness::Solver::poperatorT
std::shared_ptr< operatorT> poperatorT
Definition solver.h:629

madness::Solver::set_occs2
void set_occs2(const std::vector< KPoint > &kpoints, const std::vector< double > &eigsa, const std::vector< double > &eigsb, std::vector< double > &occsa, std::vector< double > &occsb)
Definition solver.h:1893

madness::Solver::pairvecfuncT
std::pair< vecfuncT, vecfuncT > pairvecfuncT
Definition solver.h:633

madness::Solver::_matF
std::ofstream _matF
Definition solver.h:734

madness::Solver::valueT
std::complex< T > valueT
Definition solver.h:621

madness::Solver::_eigsa
std::vector< T > _eigsa
Definition solver.h:658

madness::Solver::_kpoints
std::vector< KPoint > _kpoints
Definition solver.h:670

madness::Solver::project_ao_basis
vecfuncT project_ao_basis(World &world, KPoint kpt)
Definition solver.h:1243

madness::Solver::vectensorT
std::vector< tensorT > vectensorT
Definition solver.h:635

madness::Solver::print_fock_matrix_eigs
void print_fock_matrix_eigs(const vecfuncT &wf, const vecfuncT &vwf, KPoint kpoint)
Definition solver.h:2872

madness::Solver::_occsb
std::vector< double > _occsb
Definition solver.h:678

madness::Solver::calculate_kinetic_energy
double calculate_kinetic_energy()
Definition solver.h:2135

madness::Solver::END_TIMER
void END_TIMER(World &world, const char *msg)
Definition solver.h:765

madness::Solver::rfactoryT
FunctionFactory< T, NDIM > rfactoryT
Definition solver.h:623

madness::Solver::find_kpt_from_orb
KPoint find_kpt_from_orb(unsigned int idx)
Definition solver.h:2353

madness::Solver::_vnuc
rfunctionT _vnuc
Definition solver.h:694

madness::Solver::_params
ElectronicStructureParams _params
Definition solver.h:666

madness::Solver::kvecT
Vector< double, NDIM > kvecT
Definition solver.h:627

madness::Solver::_occsa
std::vector< double > _occsa
Definition solver.h:674

madness::Solver::print_potential_matrix_eigs
void print_potential_matrix_eigs(const vecfuncT &wf, const vecfuncT &vwf)
Definition solver.h:2843

madness::Solver::save_orbitals
void save_orbitals()
Definition solver.h:921

madness::Solver::step_restriction
void step_restriction(vecfuncT &owfs, vecfuncT &nwfs, int aorb)
Definition solver.h:3778

madness::Solver::factoryT
FunctionFactory< valueT, NDIM > factoryT
Definition solver.h:626

madness::Solver::reproject
void reproject()
Definition solver.h:2474

madness::Solver::START_TIMER
void START_TIMER(World &world)
Definition solver.h:761

madness::Solver::_outputF
std::ofstream _outputF
Definition solver.h:730

madness::Solver::_residual
double _residual
Definition solver.h:718

madness::Solver::initial_guess
void initial_guess()
Initializes alpha and beta mos, occupation numbers, eigenvalues.
Definition solver.h:1316

madness::Solver::~Solver
virtual ~Solver()
Definition solver.h:1882

madness::Solver::test_periodicity
void test_periodicity(const Function< Q, 3 > &f)
Definition solver.h:1159

madness::Solver::make_nuclear_potential_impl
void make_nuclear_potential_impl()
Definition solver.h:1034

madness::Solver::Solver
Solver(World &world, rfunctionT vnucrhon, vecfuncT phis, std::vector< T > eigs, std::vector< KPoint > kpoints, std::vector< double > occs, ElectronicStructureParams params, MolecularEntity mentity)
Definition solver.h:1847

madness::Solver::_rhob
rfunctionT _rhob
Definition solver.h:686

madness::Solver::_eigsb
std::vector< T > _eigsb
Definition solver.h:662

madness::Solver::build_fock_matrix
tensorT build_fock_matrix(vecfuncT &psi, vecfuncT &vpsi, KPoint kpoint)
Definition solver.h:3564

madness::Solver::orthonormalize
void orthonormalize(vecfuncT &wf, KPoint kpoint)
Definition solver.h:3660

madness::Solver::Solver
Solver(World &world, const rfunctionT &vnucrhon, const vecfuncT &phis, const std::vector< T > &eigs, const ElectronicStructureParams &params, MolecularEntity mentity)
Definition solver.h:1812

madness::Solver::compute_rho
rfunctionT compute_rho(const vecfuncT &phis, std::vector< KPoint > kpoints, std::vector< double > occs)
Definition solver.h:2042

madness::Solver::rtensorT
Tensor< double > rtensorT
Definition solver.h:630

madness::Solver::subspaceT
std::vector< pairvecfuncT > subspaceT
Definition solver.h:634

madness::Solver::operatorT
SeparatedConvolution< T, 3 > operatorT
Definition solver.h:628

madness::Solver::_eigF
std::ofstream _eigF
Definition solver.h:738

madness::Solver::ctensorT
Tensor< std::complex< double > > ctensorT
Definition solver.h:631

madness::Solver::apply_hf_exchange
void apply_hf_exchange(vecfuncT &phisa, vecfuncT &phisb, vecfuncT &funcsa, vecfuncT &funcsb)
Definition solver.h:2406

madness::Solver::_subspace
Subspace< T, NDIM > * _subspace
Definition solver.h:710

madness::Solver::_rho
rfunctionT _rho
Definition solver.h:690

madness::Solver::sss
double sss
Definition solver.h:760

madness::Solver::make_nuclear_potential
void make_nuclear_potential()
Definition solver.h:1094

madness::Solver::make_nuclear_charge_density_impl
void make_nuclear_charge_density_impl()
Definition solver.h:1042

madness::Solver::_rhoa
rfunctionT _rhoa
Definition solver.h:682

madness::Solver::gram_schmidt
void gram_schmidt(vecfuncT &f, KPoint kpoint)
Definition solver.h:3607

madness::Solver::_phisb
vecfuncT _phisb
Definition solver.h:654

madness::Solver::_maxthresh
double _maxthresh
Definition solver.h:726

madness::Solver::solve
void solve()
Definition solver.h:2513

madness::Solver::rfunctionT
Function< T, NDIM > rfunctionT
Definition solver.h:622

madness::Solver::load_orbitals
void load_orbitals()
Definition solver.h:942

madness::Solver::do_rhs
void do_rhs(vecfuncT &wf, vecfuncT &vwf, std::vector< KPoint > kpoints, std::vector< T > &alpha, std::vector< double > &eigs)
Definition solver.h:2939

madness::Solver::Q3
tensorT Q3(const tensorT &s)
Given overlap matrix, return rotation with 3rd order error to orthonormalize the vectors.
Definition solver.h:3624

madness::Solver::ttt
double ttt
Definition solver.h:760

madness::Solver::fix_occupations
void fix_occupations(const std::vector< T > &eps, std::vector< double > &occs)
Definition solver.h:3810

madness::Solver::update_orbitals
void update_orbitals(vecfuncT &awfs, vecfuncT &bwfs, std::vector< KPoint > kpoints)
Definition solver.h:3716

madness::Solver::print_tensor2d
void print_tensor2d(ostream &os, Tensor< Q > t)
Definition solver.h:2827

madness::Solver::_kmeshF
std::ofstream _kmeshF
Definition solver.h:742

madness::Solver::Solver
Solver(World &world, const std::string &filename)
Definition solver.h:771

madness::SubspaceK
The SubspaceK class is a container class holding previous orbitals and residuals.
Definition solver.h:193

madness::SubspaceK::tensorT
Tensor< valueT > tensorT
Definition solver.h:200

madness::SubspaceK::_world
World & _world
Definition solver.h:205

madness::SubspaceK::_Q
vectensorT _Q
Definition solver.h:209

madness::SubspaceK::functionT
Function< valueT, NDIM > functionT
Definition solver.h:196

madness::SubspaceK::update_subspace
void update_subspace(vecfuncT &awfs_new, vecfuncT &bwfs_new, const vecfuncT &awfs_old, const vecfuncT &bwfs_old)
Definition solver.h:245

madness::SubspaceK::_kpoints
std::vector< KPoint > _kpoints
Definition solver.h:217

madness::SubspaceK::valueT
std::complex< T > valueT
Definition solver.h:195

madness::SubspaceK::_subspace
vecsubspaceT _subspace
Definition solver.h:213

madness::SubspaceK::vectensorT
std::vector< tensorT > vectensorT
Definition solver.h:201

madness::SubspaceK::vecsubspaceT
std::vector< subspaceT > vecsubspaceT
Definition solver.h:202

madness::SubspaceK::SubspaceK
SubspaceK(World &world, const ElectronicStructureParams &params, const std::vector< KPoint > &kpoints)
Definition solver.h:231

madness::SubspaceK::vecfuncT
std::vector< functionT > vecfuncT
Definition solver.h:197

madness::SubspaceK::subspaceT
std::vector< pairvecfuncT > subspaceT
Definition solver.h:199

madness::SubspaceK::_params
ElectronicStructureParams _params
Definition solver.h:221

madness::SubspaceK::pairvecfuncT
std::pair< vecfuncT, vecfuncT > pairvecfuncT
Definition solver.h:198

madness::SubspaceK::_residual
double _residual
Definition solver.h:225

madness::Subspace
The SubspaceK class is a container class holding previous orbitals and residuals.
Definition solver.h:409

madness::Subspace::_Q
tensorT _Q
Definition solver.h:423

madness::Subspace::_kpoints
std::vector< KPoint > _kpoints
Definition solver.h:431

madness::Subspace::pairvecfuncT
std::pair< vecfuncT, vecfuncT > pairvecfuncT
Definition solver.h:414

madness::Subspace::_params
ElectronicStructureParams _params
Definition solver.h:435

madness::Subspace::Subspace
Subspace(World &world, const ElectronicStructureParams &params)
Definition solver.h:441

madness::Subspace::subspaceT
std::vector< pairvecfuncT > subspaceT
Definition solver.h:415

madness::Subspace::_subspace
subspaceT _subspace
Definition solver.h:427

madness::Subspace::_world
World & _world
Definition solver.h:419

madness::Subspace::vecfuncT
std::vector< functionT > vecfuncT
Definition solver.h:413

madness::Subspace::tensorT
Tensor< valueT > tensorT
Definition solver.h:416

madness::Subspace::update_subspace
void update_subspace(vecfuncT &awfs_new, vecfuncT &bwfs_new, const vecfuncT &awfs_old, const vecfuncT &bwfs_old, const vecfuncT &rm)
Definition solver.h:448

madness::Subspace::functionT
Function< valueT, NDIM > functionT
Definition solver.h:412

madness::Subspace::valueT
std::complex< T > valueT
Definition solver.h:411

madness::Subspace::reproject
void reproject()
Definition solver.h:556

madness::Tensor
A tensor is a multidimensional array.
Definition tensor.h:317

madness::Tensor::ptr
T * ptr()
Returns a pointer to the internal data.
Definition tensor.h:1825

madness::Vector
A simple, fixed dimension vector.
Definition vector.h:64

madness::WSTAtomicBasisFunctor
Definition solver.h:120

madness::WSTAtomicBasisFunctor::ky
double ky
Definition solver.h:124

madness::WSTAtomicBasisFunctor::specialpt
std::vector< coord_3d > specialpt
Definition solver.h:126

madness::WSTAtomicBasisFunctor::special_points
std::vector< coord_3d > special_points() const
Override this to return list of special points to be refined more deeply.
Definition solver.h:158

madness::WSTAtomicBasisFunctor::kx
double kx
Definition solver.h:124

madness::WSTAtomicBasisFunctor::operator()
double_complex operator()(const coord_3d &x) const
Definition solver.h:140

madness::WSTAtomicBasisFunctor::L
double L
Definition solver.h:123

madness::WSTAtomicBasisFunctor::WSTAtomicBasisFunctor
WSTAtomicBasisFunctor(const AtomicBasisFunction &aofunc, double L, double kx, double ky, double kz)
Definition solver.h:128

madness::WSTAtomicBasisFunctor::aofunc
const AtomicBasisFunction aofunc
Definition solver.h:122

madness::WSTAtomicBasisFunctor::kz
double kz
Definition solver.h:124

madness::WSTAtomicBasisFunctor::~WSTAtomicBasisFunctor
~WSTAtomicBasisFunctor()
Definition solver.h:138

madness::WorldGopInterface::broadcast_serializable
void broadcast_serializable(objT &obj, ProcessID root)
Broadcast a serializable object.
Definition worldgop.h:756

madness::WorldGopInterface::fence
void fence(bool debug=false)
Synchronizes all processes in communicator AND globally ensures no pending AM or tasks.
Definition worldgop.cc:161

madness::WorldGopInterface::broadcast
void broadcast(void *buf, size_t nbyte, ProcessID root, bool dowork=true, Tag bcast_tag=-1)
Broadcasts bytes from process root while still processing AM & tasks.
Definition worldgop.cc:173

madness::WorldGopInterface::sum
void sum(T *buf, size_t nelem)
Inplace global sum while still processing AM & tasks.
Definition worldgop.h:872

madness::World
A parallel world class.
Definition world.h:132

madness::World::rank
ProcessID rank() const
Returns the process rank in this World (same as MPI_Comm_rank()).
Definition world.h:320

madness::World::size
ProcessID size() const
Returns the number of processes in this World (same as MPI_Comm_size()).
Definition world.h:330

madness::World::gop
WorldGopInterface & gop
Global operations.
Definition world.h:207

madness::archive::ParallelInputArchive
An archive for storing local or parallel data, wrapping a BinaryFstreamInputArchive.
Definition parallel_archive.h:366

madness::archive::ParallelOutputArchive
An archive for storing local or parallel data wrapping a BinaryFstreamOutputArchive.
Definition parallel_archive.h:321

complexfun.h

R
static const double R
Definition csqrt.cc:46

f1
double(* f1)(const coord_3d &)
Definition derivatives.cc:55

f3
double(* f3)(const coord_3d &)
Definition derivatives.cc:57

f2
double(* f2)(const coord_3d &)
Definition derivatives.cc:56

delta
const double delta
Definition dielectric_external_field.cc:119

electronicstructureparams.h

esolver.h

is_equal
bool is_equal(double val1, double val2, double eps)
Definition esolver.h:190

rfunctorT
std::shared_ptr< FunctionFunctorInterface< double, 3 > > rfunctorT
Definition esolver.h:46

fortran_ctypes.h
Correspondence between C++ and Fortran types.

T
auto T(World &world, response_space &f) -> response_space
Definition global_functions.cc:28

madness::Solver::compute_rho_slow
rfunctionT compute_rho_slow(const vecfuncT &phis, std::vector< KPoint > kpoints, std::vector< double > occs)
Compute the electronic density for either a molecular or periodic system.
Definition solver.h:2010

madness::stheta_fd
T stheta_fd(const T &x)
Definition solver.h:75

madness::Solver::apply_potential
void apply_potential(vecfuncT &pfuncsa, vecfuncT &pfuncsb, const vecfuncT &phisa, const vecfuncT &phisb, const rfunctionT &rhoa, const rfunctionT &rhob, const rfunctionT &rho)
Applies the LDA effective potential to each orbital. Currently only lda and spin-polarized is not imp...
Definition solver.h:2177

madness::conj_transpose
Tensor< T > conj_transpose(const Tensor< T > &t)
Returns a new deep copy of the complex conjugate transpose of the input tensor.
Definition tensor.h:2028

madness::arg
Tensor< typename Tensor< T >::scalar_type > arg(const Tensor< T > &t)
Return a new tensor holding the argument of each element of t (complex types only)
Definition tensor.h:2503

psi
double psi(const Vector< double, 3 > &r)
Definition hatom_energy.cc:78

v
static const double v
Definition hatom_sf_dirac.cc:20

oi
static const long oi
Definition he.cc:16

op
Tensor< double > op(const Tensor< double > &x)
Definition kain.cc:508

max
#define max(a, b)
Definition lda.h:51

libxc.h

rot
#define rot(x, k)
Definition lookup3.c:72

MADNESS_EXCEPTION
#define MADNESS_EXCEPTION(msg, value)
Macro for throwing a MADNESS exception.
Definition madness_exception.h:119

MADNESS_ASSERT
#define MADNESS_ASSERT(condition)
Assert a condition that should be free of side-effects since in release builds this might be a no-op.
Definition madness_exception.h:134

mra.h
Main include file for MADNESS and defines Function interface.

madness::constants::pi
constexpr double pi
Mathematical constant .
Definition constants.h:48

madness
Namespace for all elements and tools of MADNESS.
Definition DFParameters.h:10

madness::BC_PERIODIC
@ BC_PERIODIC
Definition bc.h:52

madness::filename
static const char * filename
Definition legendre.cc:96

madness::vector_complex_function_3d
std::vector< complex_function_3d > vector_complex_function_3d
Definition functypedefs.h:101

madness::abs
double abs(double x)
Definition complexfun.h:48

madness::cpu_time
static double cpu_time()
Returns the cpu time in seconds relative to an arbitrary origin.
Definition timers.h:127

madness::abssq
Function< double, NDIM > abssq(const Function< double_complex, NDIM > &z, bool fence=true)
Returns a new function that is the square of the absolute value of the input.
Definition mra.h:2778

madness::KAIN
Tensor< T > KAIN(const Tensor< T > &Q, double rcond=1e-12)
Solves non-linear equation using KAIN (returns coefficients to compute next vector)
Definition solvers.h:98

madness::coordT
Vector< double, 3 > coordT
Definition corepotential.cc:54

madness::sygv
void sygv(const Tensor< T > &A, const Tensor< T > &B, int itype, Tensor< T > &V, Tensor< typename Tensor< T >::scalar_type > &e)
Generalized real-symmetric or complex-Hermitian eigenproblem.
Definition lapack.cc:1052

madness::scale
response_space scale(response_space a, double b)

madness::sub
Function< TENSOR_RESULT_TYPE(L, R), NDIM > sub(const Function< L, NDIM > &left, const Function< R, NDIM > &right, bool fence=true)
Same as operator- but with optional fence and no automatic compression.
Definition mra.h:2035

madness::CoulombOperatorPtr
static SeparatedConvolution< double, 3 > * CoulombOperatorPtr(World &world, double lo, double eps, const array_of_bools< 3 > &lattice_sum=FunctionDefaults< 3 >::get_bc().is_periodic(), int k=FunctionDefaults< 3 >::get_k())
Factory function generating separated kernel for convolution with 1/r in 3D.
Definition operator.h:1818

madness::norm2s
std::vector< double > norm2s(World &world, const std::vector< Function< T, NDIM > > &v)
Computes the 2-norms of a vector of functions.
Definition vmra.h:845

madness::truncate
void truncate(World &world, response_space &v, double tol, bool fence)
Definition basic_operators.cc:31

madness::transform
std::vector< Function< TENSOR_RESULT_TYPE(T, R), NDIM > > transform(World &world, const std::vector< Function< T, NDIM > > &v, const Tensor< R > &c, bool fence=true)
Transforms a vector of functions according to new[i] = sum[j] old[j]*c[j,i].
Definition vmra.h:707

madness::conj
Function< T, NDIM > conj(const Function< T, NDIM > &f, bool fence=true)
Return the complex conjugate of the input function with the same distribution and optional fence.
Definition mra.h:2110

madness::r2
static double r2(const coord_3d &x)
Definition smooth.h:45

madness::compress
void compress(World &world, const std::vector< Function< T, NDIM > > &v, bool fence=true)
Compress a vector of functions.
Definition vmra.h:149

madness::reconstruct
const std::vector< Function< T, NDIM > > & reconstruct(const std::vector< Function< T, NDIM > > &v)
reconstruct a vector of functions
Definition vmra.h:162

madness::plotdx
void plotdx(const Function< T, NDIM > &f, const char *filename, const Tensor< double > &cell=FunctionDefaults< NDIM >::get_cell(), const std::vector< long > &npt=std::vector< long >(NDIM, 201L), bool binary=true)
Writes an OpenDX format file with a cube/slice of points on a uniform grid.
Definition mraimpl.h:3446

madness::norm2
double norm2(World &world, const std::vector< Function< T, NDIM > > &v)
Computes the 2-norm of a vector of functions.
Definition vmra.h:871

madness::_
static const Slice _(0,-1, 1)

madness::tensor_complex
Tensor< double_complex > tensor_complex
Definition functypedefs.h:59

madness::mul_sparse
Function< TENSOR_RESULT_TYPE(L, R), NDIM > mul_sparse(const Function< L, NDIM > &left, const Function< R, NDIM > &right, double tol, bool fence=true)
Sparse multiplication — left and right must be reconstructed and if tol!=0 have tree of norms already...
Definition mra.h:1806

madness::print
void print(const T &t, const Ts &... ts)
Print items to std::cout (items separated by spaces) and terminate with a new line.
Definition print.h:225

madness::apply
response_space apply(World &world, std::vector< std::vector< std::shared_ptr< real_convolution_3d > > > &op, response_space &f)
Definition basic_operators.cc:43

madness::f
NDIM & f
Definition mra.h:2481

madness::functorT
std::shared_ptr< FunctionFunctorInterface< double, 3 > > functorT
Definition corepotential.cc:55

madness::wall_time
double wall_time()
Returns the wall time in seconds relative to an arbitrary origin.
Definition timers.cc:48

madness::cvecfuncT
std::vector< complex_functionT > cvecfuncT
Definition SCF.h:80

madness::inner
double inner(response_space &a, response_space &b)
Definition response_functions.h:640

madness::normalize
void normalize(World &world, std::vector< Function< T, NDIM > > &v, bool fence=true)
Normalizes a vector of functions — v[i] = v[i].scale(1.0/v[i].norm2())
Definition vmra.h:1810

madness::BSHOperatorPtr3D
static SeparatedConvolution< double, 3 > * BSHOperatorPtr3D(World &world, double mu, double lo, double eps, const array_of_bools< 3 > &lattice_summed=FunctionDefaults< 3 >::get_bc().is_periodic(), int k=FunctionDefaults< 3 >::get_k())
Factory function generating separated kernel for convolution with exp(-mu*r)/(4*pi*r) in 3D.
Definition operator.h:2089

madness::plot_line
void plot_line(World &world, const char *filename, int npt, const Vector< double, NDIM > &lo, const Vector< double, NDIM > &hi, const opT &op)
Generates ASCII file tabulating f(r) at npoints along line r=lo,...,hi.
Definition funcplot.h:442

madness::project
Function< T, NDIM > project(const Function< T, NDIM > &other, int k=FunctionDefaults< NDIM >::get_k(), double thresh=FunctionDefaults< NDIM >::get_thresh(), bool fence=true)
Definition mra.h:2464

madness::real
double real(double x)
Definition complexfun.h:52

madness::PeriodicHFExchangeOperator
static SeparatedConvolution< double_complex, 3 > PeriodicHFExchangeOperator(World &world, Vector< double, 3 > args, double lo, double eps, const array_of_bools< 3 > &lattice_sum=FunctionDefaults< 3 >::get_bc().is_periodic(), int k=FunctionDefaults< 3 >::get_k())
Factory function generating separated kernel for convolution with 1/r in 3D.
Definition operator.h:1775

madness::matrix_inner
void matrix_inner(DistributedMatrix< T > &A, const std::vector< Function< T, NDIM > > &f, const std::vector< Function< T, NDIM > > &g, bool sym=false)
Definition distpm.cc:46

madness::copy
Function< T, NDIM > copy(const Function< T, NDIM > &f, const std::shared_ptr< WorldDCPmapInterface< Key< NDIM > > > &pmap, bool fence=true)
Create a new copy of the function with different distribution and optional fence.
Definition mra.h:2066

madness::syev
void syev(const Tensor< T > &A, Tensor< T > &V, Tensor< typename Tensor< T >::scalar_type > &e)
Real-symmetric or complex-Hermitian eigenproblem.
Definition lapack.cc:969

madness::phase
static double phase(long i)
Definition twoscale.cc:85

madness::gaxpy
void gaxpy(const double a, ScalarResult< T > &left, const double b, const T &right, const bool fence=true)
the result type of a macrotask must implement gaxpy
Definition macrotaskq.h:245

std::abs
static long abs(long a)
Definition tensor.h:218

xc
XCfunctional xc
Definition newsolver_lda.cc:53

poperator.h

Q
double Q(double a)
Definition relops.cc:20

c
static const double c
Definition relops.cc:10

m
static const double m
Definition relops.cc:9

thresh
static const double thresh
Definition rk.cc:45

k
static const long k
Definition rk.cc:44

solvers.h
Defines interfaces for optimization and non-linear equation solvers.

madness::ElectronicStructureParams
Definition electronicstructureparams.h:46

madness::ElectronicStructureParams::maxsub
unsigned int maxsub
Definition electronicstructureparams.h:86

madness::ElectronicStructureParams::spinpol
bool spinpol
Definition electronicstructureparams.h:56

madness::ElectronicStructureParams::nio
int nio
Definition electronicstructureparams.h:98

madness::ElectronicStructureParams::fractional
bool fractional
Definition electronicstructureparams.h:84

madness::ElectronicStructureParams::ncharge
double ncharge
Definition electronicstructureparams.h:103

madness::ElectronicStructureParams::koffset2
double koffset2
Definition electronicstructureparams.h:94

madness::ElectronicStructureParams::ngridk1
int ngridk1
Definition electronicstructureparams.h:78

madness::ElectronicStructureParams::ispotential
bool ispotential
Definition electronicstructureparams.h:62

madness::ElectronicStructureParams::restart
int restart
Definition electronicstructureparams.h:101

madness::ElectronicStructureParams::canon
bool canon
Definition electronicstructureparams.h:90

madness::ElectronicStructureParams::maxits
int maxits
Definition electronicstructureparams.h:60

madness::ElectronicStructureParams::rcriterion
double rcriterion
Definition electronicstructureparams.h:111

madness::ElectronicStructureParams::nempty
int nempty
Definition electronicstructureparams.h:72

madness::ElectronicStructureParams::nelec
int nelec
Definition electronicstructureparams.h:50

madness::ElectronicStructureParams::koffset1
double koffset1
Definition electronicstructureparams.h:94

madness::ElectronicStructureParams::nbands
int nbands
Definition electronicstructureparams.h:76

madness::ElectronicStructureParams::basis
std::string basis
Definition electronicstructureparams.h:96

madness::ElectronicStructureParams::read_file
void read_file(const std::string &filename)
Definition electronicstructureparams.h:170

madness::ElectronicStructureParams::waveorder
int waveorder
Definition electronicstructureparams.h:66

madness::ElectronicStructureParams::swidth
double swidth
Definition electronicstructureparams.h:105

madness::ElectronicStructureParams::sd
double sd
Definition electronicstructureparams.h:115

madness::ElectronicStructureParams::lo
double lo
Definition electronicstructureparams.h:54

madness::ElectronicStructureParams::thresh
double thresh
Definition electronicstructureparams.h:64

madness::ElectronicStructureParams::plotorbs
bool plotorbs
Definition electronicstructureparams.h:109

madness::ElectronicStructureParams::functional
int functional
Definition electronicstructureparams.h:52

madness::ElectronicStructureParams::ngridk0
int ngridk0
Definition electronicstructureparams.h:78

madness::ElectronicStructureParams::L
double L
Definition electronicstructureparams.h:48

madness::ElectronicStructureParams::centered
bool centered
Definition electronicstructureparams.h:113

madness::ElectronicStructureParams::print_matrices
bool print_matrices
Definition electronicstructureparams.h:107

madness::ElectronicStructureParams::solver
int solver
Definition electronicstructureparams.h:92

madness::ElectronicStructureParams::periodic
bool periodic
Definition electronicstructureparams.h:58

madness::ElectronicStructureParams::ngridk2
int ngridk2
Definition electronicstructureparams.h:78

madness::ElectronicStructureParams::koffset0
double koffset0
Definition electronicstructureparams.h:94

madness::Solver::GuessDensity
Definition solver.h:1121

madness::Solver::GuessDensity::operator()
double operator()(const coordT &x) const
Definition solver.h:1127

madness::Solver::GuessDensity::periodic
const bool periodic
Definition solver.h:1125

madness::Solver::GuessDensity::mentity
const MolecularEntity & mentity
Definition solver.h:1122

madness::Solver::GuessDensity::R
double R
Definition solver.h:1124

madness::Solver::GuessDensity::GuessDensity
GuessDensity(const MolecularEntity &mentity, const AtomicBasisSet &aobasis, const double &R, const bool &periodic)
Definition solver.h:1151

madness::Solver::GuessDensity::aobasis
const AtomicBasisSet & aobasis
Definition solver.h:1123

I
static const double_complex I
Definition tdse1d.cc:164

eshift
static const double eshift
Definition tdse1d.cc:153

sum
AtomicInt sum
Definition test_atomicint.cc:46

e
void e()
Definition test_sig.cc:75

ky
static const double ky
Definition testcosine.cc:16

kz
static const double kz
Definition testcosine.cc:16

kx
static const double kx
Definition testcosine.cc:16

alpha
static const double alpha
Definition testcosine.cc:10

START_TIMER
#define START_TIMER
Definition testgaxpyext.cc:9

END_TIMER
#define END_TIMER(msg)
Definition testgaxpyext.cc:10

one
constexpr coord_t one(1.0)

NDIM
constexpr std::size_t NDIM
Definition testgconv.cc:54

g1
double g1(const coord_t &r)
Definition testgconv.cc:122

npts
const auto npts
Definition testgconv.cc:52

k0
double k0
Definition testperiodic.cc:66

k2
double k2
Definition testperiodic.cc:68

k1
double k1
Definition testperiodic.cc:67

weight
FLOAT weight(const FLOAT &x)
Definition y.cc:309