madness/api-doc/exchangeoperator_8h_source.html

 #ifndef SRC_APPS_CHEM_EXCHANGEOPERATOR_H_

 #define SRC_APPS_CHEM_EXCHANGEOPERATOR_H_


 #include <utility>

 #include<madness.h>

 #include<madness/world/cloud.h>

 #include<madness/mra/macrotaskq.h>

 #include<madness/chem/SCFOperators.h>


 namespace madness {


 // forward declaration

 class SCF;

 class Nemo;


 template<typename T, std::size_t NDIM>

 class Exchange<T,NDIM>::ExchangeImpl {

     /// a single NDIM-dimensional function with coefficient type T
     typedef Function<T, NDIM> functionT;

     /// a vector of functions
     typedef std::vector<functionT> vecfuncT;


     // Timing accumulators, static and therefore shared by all instances.
     // print_timer() scales them by 0.001 and reports seconds, so they
     // presumably hold milliseconds -- TODO confirm where they are incremented.
     static inline std::atomic<long> apply_timer; ///< reported as "apply" by print_timer()

     static inline std::atomic<long> mul2_timer; ///< reported as "multiply2" by print_timer()

     static inline std::atomic<long> mul1_timer; ///< reported as "multiply1" by print_timer()


     /// set all three static timing accumulators back to zero
     static void reset_timer() {
         mul1_timer.store(0l);
         mul2_timer.store(0l);
         apply_timer.store(0l);
     }


     /// sum the timing accumulators over all ranks of world and print them on rank 0

     /// @param[in]  world   the world used for the global sum and for the rank test
     static void print_timer(World& world) {
         // read all three accumulators first, then reduce them one after the other
         double seconds[3] = {double(mul1_timer.load()) * 0.001,
                              double(apply_timer.load()) * 0.001,
                              double(mul2_timer.load()) * 0.001};
         for (double& s : seconds) world.gop.sum(s);

         // only rank 0 reports
         if (world.rank() != 0) return;
         printf(" cpu time spent in multiply1   %8.2fs\n", seconds[0]);
         printf(" cpu time spent in apply       %8.2fs\n", seconds[1]);
         printf(" cpu time spent in multiply2   %8.2fs\n", seconds[2]);
     }


 public:


     /// the algorithm selector is the type declared in the enclosing Exchange class
     typedef Exchange<T,NDIM>::Algorithm Algorithm;

     /// selected algorithm, changed via set_algorithm(); defaults to multiworld_efficient
     Algorithm algorithm_ = multiworld_efficient;


     /// ctor from explicit parameters; bra and ket stay empty until set_bra_and_ket() is called

     /// Note: this is not a default ctor, all three arguments are required.
     /// @param[in]  world   the world stored in this object
     /// @param[in]  lo      stored in the member lo
     /// @param[in]  thresh  stored in the member thresh
     ExchangeImpl(World& world, const double lo, const double thresh) : world(world), lo(lo), thresh(thresh) {}


     /// ctor with a conventional calculation (declared only, the definition is not in this header)

     /// @param[in]  ispin   presumably selects alpha or beta orbitals -- TODO confirm in the definition
     ExchangeImpl(World& world, const SCF *calc, const int ispin) ;


     /// ctor with a nemo calculation (declared only, the definition is not in this header)

     /// @param[in]  ispin   presumably selects alpha or beta orbitals -- TODO confirm in the definition
     ExchangeImpl(World& world, const Nemo *nemo, const int ispin);


     /// set the bra and ket orbital spaces


     /// Copies of both vectors, made with copy(world, ...), are stored in mo_bra and mo_ket.
     /// @param[in]  bra     bra space, must be provided as complex conjugate

     /// @param[in]  ket     ket space

     void set_bra_and_ket(const vecfuncT& bra, const vecfuncT& ket) {

         mo_bra = copy(world, bra);

         mo_ket = copy(world, ket);

     }


     /// short label identifying this operator; always returns "K"
     std::string info() const {return "K";}


     /// create the 3D Coulomb convolution operator and hand it out as a shared pointer

     /// @param[in]  world   forwarded to CoulombOperatorPtr
     /// @param[in]  lo      forwarded to CoulombOperatorPtr as its lo argument
     /// @param[in]  econv   forwarded to CoulombOperatorPtr as its third argument; defaults to the 3D default threshold
     /// @return     a std::shared_ptr<real_convolution_3d> owning the new operator
     static auto set_poisson(World& world, const double lo, const double econv = FunctionDefaults<3>::get_thresh()) {
         std::shared_ptr<real_convolution_3d> poisson(CoulombOperatorPtr(world, lo, econv));
         return poisson;
     }


     /// apply the exchange operator on a vector of functions


     /// note that only one spin is used (either alpha or beta orbitals)

     /// @param[in]  vket       the orbitals |i> that the operator is applied on

     /// @return     a vector of orbitals  K| i>

     vecfuncT operator()(const vecfuncT& vket) const;


     /// @return     the current value of the symmetric_ flag, see symmetric()
     bool is_symmetric() const { return symmetric_; }


     /// store the macrotask queue in this object

     /// @param[in]  taskq1  the queue; taken by value and moved into the member
     /// @return     *this, so that setters can be chained
     ExchangeImpl& set_taskq(std::shared_ptr<MacroTaskQ> taskq1) {
         // sink parameter: moving avoids a second atomic reference-count update
         this->taskq = std::move(taskq1);
         return *this;
     }


     /// set the flag reported by is_symmetric()

     /// @param[in]  flag    new value of symmetric_
     /// @return     *this, so that setters can be chained
     ExchangeImpl& symmetric(const bool flag) {
         this->symmetric_ = flag;
         return *this;
     }


     /// select the algorithm

     /// @param[in]  alg     new value of algorithm_
     /// @return     *this, so that setters can be chained
     ExchangeImpl& set_algorithm(const Algorithm& alg) {
         this->algorithm_ = alg;
         return *this;
     }


     /// set the verbosity

     /// @param[in]  level   new value of printlevel (3 and above: timings, 10 and above: debug)
     /// @return     *this, so that setters can be chained
     ExchangeImpl& set_printlevel(const long& level) {
         this->printlevel = level;
         return *this;
     }


 private:


     /// exchange using macrotasks, i.e. apply K on a function in individual worlds

     vecfuncT K_macrotask_efficient(const vecfuncT& vket, const double mul_tol = 0.0) const;


     /// computing the full square of the double sum (over vket and the K orbitals)

     vecfuncT K_small_memory(const vecfuncT& vket, const double mul_tol = 0.0) const;


     /// computing the upper triangle of the double sum (over vket and the K orbitals)

     vecfuncT K_large_memory(const vecfuncT& vket, const double mul_tol = 0.0) const;


     /// compute one tile of K from the given bra, ket and vket vectors

     /// Static, so it can be called without an ExchangeImpl object; the macrotask
     /// helpers in this header call it with batches of bra, ket and vket.
     /// NOTE(review): the exact meaning of the symmetric flag is defined in the
     /// out-of-line definition, not in this header -- confirm there.
     static vecfuncT compute_K_tile(World& world, const vecfuncT& mo_bra, const vecfuncT& mo_ket,

                                    const vecfuncT& vket, std::shared_ptr<real_convolution_3d> poisson,

                                    const bool symmetric, const double mul_tol = 0.0);


     /// timings are printed on rank 0 only, and only for printlevel 3 and above
     inline bool do_print_timings() const {
         const bool on_rank_zero = (world.rank() == 0);
         return on_rank_zero && (printlevel >= 3);
     }


     /// debug output is enabled for printlevel 10 and above
     inline bool printdebug() const {
         return not (printlevel < 10);
     }


     /// the world this object was constructed with
     World& world;

     /// macrotask queue; empty unless set via set_taskq()
     std::shared_ptr<MacroTaskQ> taskq;

     bool symmetric_ = false;      ///< is the exchange matrix symmetric? K phi_i = \sum_k \phi_k \int \phi_k \phi_i

     vecfuncT mo_bra, mo_ket;    ///< MOs for bra and ket

     /// presumably the lo argument handed to set_poisson() -- TODO confirm in the definitions
     double lo = 1.e-4;

     /// threshold; defaults to the NDIM-dimensional function default
     double thresh = FunctionDefaults<NDIM>::get_thresh();

     /// verbosity: do_print_timings() needs >= 3 (and rank 0), printdebug() needs >= 10
     long printlevel = 0;

     /// NOTE(review): not referenced anywhere in the visible part of this header
     double mul_tol = 0.0;


     class MacroTaskExchangeSimple : public MacroTaskOperationBase {


         /// number of functions in the vector returned by operator()
         long nresult;

         /// passed as lo to set_poisson() when a tile is computed
         double lo = 1.e-4;

         /// NOTE(review): stored by the ctor, but the compute_* helpers of this
         /// class pass a fixed 0.0 to compute_K_tile instead -- confirm intent
         double mul_tol = 1.e-7;

         /// selects between the symmetric and the asymmetric code path in operator()
         bool symmetric = false;


         /// custom partitioning for the exchange operator in exchangeoperator.h

         /// arguments are: result[i] += sum_k vket[k] \int 1/r vbra[k] f[i]
         /// with f and vbra being batched, result and vket being passed on as a whole
         class MacroTaskPartitionerExchange : public MacroTaskPartitioner {
         public:
             /// if true only the tiles (i,j) with j >= i are generated, all taken from the first partition
             bool symmetric = false;

             MacroTaskPartitionerExchange(const bool symmetric) : symmetric(symmetric) {
                 max_batch_size=30;
             }

             /// build the list of 2D tiles together with their priorities

             /// \param vsize1   length of the first batched vector
             /// \param vsize2   length of the second batched vector
             /// \param policy   forwarded to do_1d_partition
             /// \return the list of (batch, priority) pairs
             partitionT do_partitioning(const std::size_t& vsize1, const std::size_t& vsize2,
                                        const std::string policy) const override {

                 partitionT rows = do_1d_partition(vsize1, policy);
                 partitionT cols = do_1d_partition(vsize2, policy);
                 partitionT tiles;

                 // combine two 1D batches into a 2D tile and append it with its priority
                 auto append_tile = [&](const auto& row, const auto& col) {
                     Batch tile(row->first.input[0], col->first.input[0], _);
                     const double priority = compute_priority(tile);
                     tiles.push_back(std::make_pair(tile, priority));
                 };

                 for (auto row = rows.begin(); row != rows.end(); ++row) {
                     if (symmetric) {
                         // upper triangle including the diagonal
                         for (auto col = row; col != rows.end(); ++col) append_tile(row, col);
                     } else {
                         // full rectangle
                         for (auto col = cols.begin(); col != cols.end(); ++col) append_tile(row, col);
                     }
                 }
                 return tiles;
             }

             /// compute the priority of this task for non-dumb scheduling

             /// \return the priority as double number (no limits): the number of elements in the tile
             double compute_priority(const Batch& batch) const override {
                 MADNESS_CHECK(batch.input.size() == 2);   // batches must be two-dimensional
                 const long nrow = batch.input[0].size();
                 const long ncol = batch.input[1].size();
                 return static_cast<double>(nrow * ncol);
             }
         };


     public:

         /// store the parameters and install the exchange-specific partitioner

         /// \param nresult      number of functions in the vector returned by operator()
         /// \param lo           passed as lo to set_poisson() when a tile is computed
         /// \param mul_tol      stored; NOTE(review): the compute_* helpers of this class pass a fixed 0.0 instead
         /// \param symmetric    selects the symmetric code path and the triangular partitioning
         MacroTaskExchangeSimple(const long nresult, const double lo, const double mul_tol, const bool symmetric)

                 : nresult(nresult), lo(lo), mul_tol(mul_tol), symmetric(symmetric) {

             partitioner.reset(new MacroTaskPartitionerExchange(symmetric));

         }


         // you need to define the exact argument(s) of operator() as tuple

         typedef std::tuple<const std::vector<Function<T, NDIM>>&,

                 const std::vector<Function<T, NDIM>>&,

                 const std::vector<Function<T, NDIM>>&> argtupleT;


         using resultT = std::vector<Function<T, NDIM>>;


         // creates the empty result: one compressed zero function for each
         // element of the first argument of operator();
         // resultT must implement operator+=(const resultT&)
         resultT allocator(World& world, const argtupleT& argtuple) const {
             const auto& first_argument = std::get<0>(argtuple);
             return zero_functions_compressed<T, NDIM>(world, first_argument.size());
         }


         /// compute one tile of K and place it into a result vector of length nresult

         /// \param vf_batch     batch of the functions K is applied on
         /// \param bra_batch    batch of the bra orbitals
         /// \param vket         all ket orbitals
         /// \return a vector of nresult functions, zero outside the ranges of this tile
         std::vector<Function<T, NDIM>>
         operator()(const std::vector<Function<T, NDIM>>& vf_batch,     // will be batched (column)
                    const std::vector<Function<T, NDIM>>& bra_batch,    // will be batched (row)
                    const std::vector<Function<T, NDIM>>& vket) {       // will not be batched

             World& world = vf_batch.front().world();
             resultT Kf = zero_functions_compressed<T, NDIM>(world, nresult);

             // compare the ranges before the open-ended ones are closed below
             const bool diagonal_block = batch.input[0] == batch.input[1];
             auto& vf_range = batch.input[0];       // corresponds to vf_batch
             auto& bra_range = batch.input[1];      // corresponds to vbra

             if (vf_range.is_full_size()) vf_range.end = vf_batch.size();
             if (bra_range.is_full_size()) bra_range.end = bra_batch.size();

             MADNESS_CHECK(vf_range.end <= nresult);
             if (symmetric) {
                 MADNESS_CHECK(bra_range.end <= nresult);
             }

             // add a partial result to those elements of Kf that are addressed by range
             auto accumulate = [&Kf](const auto& range, const vecfuncT& partial) {
                 for (int i = range.begin; i < range.end; ++i) Kf[i] += partial[i - range.begin];
             };

             if (not symmetric) {
                 auto ket_batch = bra_range.copy_batch(vket);
                 vecfuncT resultcolumn = compute_batch_in_asymmetric_matrix(world, ket_batch, bra_batch, vf_batch);
                 accumulate(vf_range, resultcolumn);
             } else if (diagonal_block) {
                 auto ket_batch = bra_range.copy_batch(vket);
                 vecfuncT resultcolumn = compute_diagonal_batch_in_symmetric_matrix(world, ket_batch, bra_batch,
                                                                                    vf_batch);
                 accumulate(vf_range, resultcolumn);
             } else {
                 // off-diagonal tile: one computation feeds both the bra range and the vf range
                 auto[resultcolumn, resultrow]=compute_offdiagonal_batch_in_symmetric_matrix(world, vket, bra_batch,
                                                                                             vf_batch);
                 accumulate(bra_range, resultcolumn);
                 accumulate(vf_range, resultrow);
             }
             return Kf;
         }


         /// compute a batch of the exchange matrix, with identical ranges, exploiting the matrix symmetry

         /// Forwards to compute_K_tile with the symmetric flag set to true.
         /// \param subworld     the world we're computing in
         /// \param ket_batch    the ket batch of orbitals, i.e. the orbitals to premultiply with
         /// \param bra_batch    the bra batch of orbitals (including the nuclear correlation factor square)
         /// \param vf_batch     the argument of the exchange operator
         /// \return             the result of compute_K_tile for this batch
         vecfuncT compute_diagonal_batch_in_symmetric_matrix(World& subworld,
                                                             const vecfuncT& ket_batch,      // is batched
                                                             const vecfuncT& bra_batch,      // is batched
                                                             const vecfuncT& vf_batch        // is batched
         ) const {
             // NOTE(review): the member mul_tol set by the ctor is not used; a fixed
             // 0.0 is passed on, exactly as before -- confirm that this is intended
             const double tile_mul_tol = 0.0;
             // a genuine bool: the flag used to be declared as double and shadowed the member
             const bool exploit_symmetry = true;
             auto poisson = Exchange<double, 3>::ExchangeImpl::set_poisson(subworld, lo);
             return Exchange<T, NDIM>::ExchangeImpl::compute_K_tile(subworld, bra_batch, ket_batch, vf_batch, poisson,
                                                                     exploit_symmetry, tile_mul_tol);
         }


         /// compute a batch of the exchange matrix, with non-identical ranges

         /// Forwards to compute_K_tile with the symmetric flag set to false.
         /// \param subworld     the world we're computing in
         /// \param ket_batch    the ket batch of orbitals, i.e. the orbitals to premultiply with
         /// \param bra_batch    the bra batch of orbitals (including the nuclear correlation factor square)
         /// \param vf_batch     the argument of the exchange operator
         /// \return             the result of compute_K_tile for this batch
         vecfuncT compute_batch_in_asymmetric_matrix(World& subworld,
                                                     const vecfuncT& ket_batch,
                                                     const vecfuncT& bra_batch,
                                                     const vecfuncT& vf_batch) const {
             // NOTE(review): the member mul_tol set by the ctor is not used; a fixed
             // 0.0 is passed on, exactly as before -- confirm that this is intended
             const double tile_mul_tol = 0.0;
             // a genuine bool: the flag used to be declared as double and shadowed the member
             const bool exploit_symmetry = false;
             auto poisson = Exchange<double, 3>::ExchangeImpl::set_poisson(subworld, lo);
             return Exchange<T, NDIM>::ExchangeImpl::compute_K_tile(subworld, bra_batch, ket_batch, vf_batch, poisson,
                                                                     exploit_symmetry, tile_mul_tol);
         }


         /// compute an off-diagonal batch of the exchange matrix in the symmetric case


         /// Declared only; the definition is not in this header.
         /// \param subworld     the world we're computing in

         /// \param ket          all ket orbitals (not batched)

         /// \param bra_batch    the bra batch of orbitals (including the nuclear correlation factor square)

         /// \param vf_batch     the argument of the exchange operator

         /// \return a pair; operator() adds the first element to the bra range and the second to the vf range

         std::pair<vecfuncT, vecfuncT> compute_offdiagonal_batch_in_symmetric_matrix(World& subworld,

                                                                                     const vecfuncT& ket, // not batched

                                                                                     const vecfuncT& bra_batch, // batched

                                                                                     const vecfuncT& vf_batch) const; // batched


     };


 };


 } /* namespace madness */


 #endif /* SRC_APPS_CHEM_EXCHANGEOPERATOR_H_ */

SCFOperators.h
Operators for the molecular HF and DFT code.

madness::Batch
a batch consists of a 2D-input batch and a 1D-output batch: K-batch <- (I-batch, J-batch)
Definition: macrotaskpartitioner.h:132

madness::Batch::input
std::vector< Batch_1D > input
Definition: macrotaskpartitioner.h:135

madness::Exchange::ExchangeImpl::MacroTaskExchangeSimple::MacroTaskPartitionerExchange
custom partitioning for the exchange operator in exchangeoperator.h
Definition: exchangeoperator.h:143

madness::Exchange::ExchangeImpl::MacroTaskExchangeSimple::MacroTaskPartitionerExchange::compute_priority
double compute_priority(const Batch &batch) const override
compute the priority of this task for non-dumb scheduling
Definition: exchangeoperator.h:178

madness::Exchange::ExchangeImpl::MacroTaskExchangeSimple::MacroTaskPartitionerExchange::MacroTaskPartitionerExchange
MacroTaskPartitionerExchange(const bool symmetric)
Definition: exchangeoperator.h:145

madness::Exchange::ExchangeImpl::MacroTaskExchangeSimple::MacroTaskPartitionerExchange::do_partitioning
partitionT do_partitioning(const std::size_t &vsize1, const std::size_t &vsize2, const std::string policy) const override
override this if you want your own partitioning
Definition: exchangeoperator.h:151

madness::Exchange::ExchangeImpl::MacroTaskExchangeSimple
Definition: exchangeoperator.h:132

madness::Exchange::ExchangeImpl::MacroTaskExchangeSimple::compute_diagonal_batch_in_symmetric_matrix
vecfuncT compute_diagonal_batch_in_symmetric_matrix(World &subworld, const vecfuncT &ket_batch, const vecfuncT &bra_batch, const vecfuncT &vf_batch) const
compute a batch of the exchange matrix, with identical ranges, exploiting the matrix symmetry
Definition: exchangeoperator.h:258

madness::Exchange::ExchangeImpl::MacroTaskExchangeSimple::MacroTaskExchangeSimple
MacroTaskExchangeSimple(const long nresult, const double lo, const double mul_tol, const bool symmetric)
Definition: exchangeoperator.h:187

madness::Exchange::ExchangeImpl::MacroTaskExchangeSimple::nresult
long nresult
Definition: exchangeoperator.h:134

madness::Exchange::ExchangeImpl::MacroTaskExchangeSimple::resultT
std::vector< Function< T, NDIM > > resultT
Definition: exchangeoperator.h:198

madness::Exchange::ExchangeImpl::MacroTaskExchangeSimple::compute_batch_in_asymmetric_matrix
vecfuncT compute_batch_in_asymmetric_matrix(World &subworld, const vecfuncT &ket_batch, const vecfuncT &bra_batch, const vecfuncT &vf_batch) const
compute a batch of the exchange matrix, with non-identical ranges
Definition: exchangeoperator.h:277

madness::Exchange::ExchangeImpl::MacroTaskExchangeSimple::argtupleT
std::tuple< const std::vector< Function< T, NDIM > > &, const std::vector< Function< T, NDIM > > &, const std::vector< Function< T, NDIM > > & > argtupleT
Definition: exchangeoperator.h:196

madness::Exchange::ExchangeImpl::MacroTaskExchangeSimple::allocator
resultT allocator(World &world, const argtupleT &argtuple) const
Definition: exchangeoperator.h:202

madness::Exchange::ExchangeImpl::MacroTaskExchangeSimple::operator()
std::vector< Function< T, NDIM > > operator()(const std::vector< Function< T, NDIM >> &vf_batch, const std::vector< Function< T, NDIM >> &bra_batch, const std::vector< Function< T, NDIM >> &vket)
Definition: exchangeoperator.h:209

madness::Exchange::ExchangeImpl
Definition: exchangeoperator.h:17

madness::Exchange::ExchangeImpl::mul1_timer
static std::atomic< long > mul1_timer
timing
Definition: exchangeoperator.h:23

madness::Exchange::ExchangeImpl::print_timer
static void print_timer(World &world)
Definition: exchangeoperator.h:31

madness::Exchange::ExchangeImpl::Algorithm
Exchange< T, NDIM >::Algorithm Algorithm
Definition: exchangeoperator.h:47

madness::Exchange::ExchangeImpl::set_taskq
ExchangeImpl & set_taskq(std::shared_ptr< MacroTaskQ > taskq1)
Definition: exchangeoperator.h:83

madness::Exchange::ExchangeImpl::set_algorithm
ExchangeImpl & set_algorithm(const Algorithm &alg)
Definition: exchangeoperator.h:93

madness::Exchange::ExchangeImpl::reset_timer
static void reset_timer()
Definition: exchangeoperator.h:25

madness::Exchange::ExchangeImpl::mo_bra
vecfuncT mo_bra
MOs for bra and ket
Definition: exchangeoperator.h:126

madness::Exchange::ExchangeImpl::world
World & world
Definition: exchangeoperator.h:123

madness::Exchange::ExchangeImpl::taskq
std::shared_ptr< MacroTaskQ > taskq
Definition: exchangeoperator.h:124

madness::Exchange::ExchangeImpl::symmetric
ExchangeImpl & symmetric(const bool flag)
Definition: exchangeoperator.h:88

madness::Exchange::ExchangeImpl::functionT
Function< T, NDIM > functionT
Definition: exchangeoperator.h:18

madness::Exchange::ExchangeImpl::is_symmetric
bool is_symmetric() const
Definition: exchangeoperator.h:81

madness::Exchange::ExchangeImpl::set_printlevel
ExchangeImpl & set_printlevel(const long &level)
Definition: exchangeoperator.h:98

madness::Exchange::ExchangeImpl::vecfuncT
std::vector< functionT > vecfuncT
Definition: exchangeoperator.h:19

madness::Exchange::ExchangeImpl::compute_K_tile
static vecfuncT compute_K_tile(World &world, const vecfuncT &mo_bra, const vecfuncT &mo_ket, const vecfuncT &vket, std::shared_ptr< real_convolution_3d > poisson, const bool symmetric, const double mul_tol=0.0)
computing the upper triangle of the double sum (over vket and the K orbitals)
Definition: exchangeoperator.cc:167

madness::Exchange::ExchangeImpl::apply_timer
static std::atomic< long > apply_timer
Definition: exchangeoperator.h:21

madness::Exchange::ExchangeImpl::ExchangeImpl
ExchangeImpl(World &world, const double lo, const double thresh)
default ctor
Definition: exchangeoperator.h:51

madness::Exchange::ExchangeImpl::info
std::string info() const
Definition: exchangeoperator.h:68

madness::Exchange::ExchangeImpl::do_print_timings
bool do_print_timings() const
Definition: exchangeoperator.h:119

madness::Exchange::ExchangeImpl::printdebug
bool printdebug() const
Definition: exchangeoperator.h:121

madness::Exchange::ExchangeImpl::set_poisson
static auto set_poisson(World &world, const double lo, const double econv=FunctionDefaults< 3 >::get_thresh())
Definition: exchangeoperator.h:70

madness::Exchange::ExchangeImpl::mul2_timer
static std::atomic< long > mul2_timer
Definition: exchangeoperator.h:22

madness::Exchange::ExchangeImpl::set_bra_and_ket
void set_bra_and_ket(const vecfuncT &bra, const vecfuncT &ket)
set the bra and ket orbital spaces, and the occupation
Definition: exchangeoperator.h:63

madness::Exchange
Definition: SCFOperators.h:104

madness::Exchange::operator()
Function< T, NDIM > operator()(const Function< T, NDIM > &ket) const
Definition: SCFOperators.h:150

madness::Exchange::Algorithm
Algorithm
Definition: SCFOperators.h:116

madness::Exchange::multiworld_efficient
@ multiworld_efficient
Definition: SCFOperators.h:117

madness::FunctionDefaults
FunctionDefaults holds default parameters as static class members.
Definition: funcdefaults.h:204

madness::FunctionDefaults::get_thresh
static const double & get_thresh()
Returns the default threshold.
Definition: funcdefaults.h:279

madness::Function
A multiresolution adaptive numerical function.
Definition: mra.h:122

madness::MacroTaskOperationBase
Definition: macrotaskq.h:716

madness::MacroTaskPartitioner
partition one (two) vectors into 1D (2D) batches.
Definition: macrotaskpartitioner.h:190

madness::MacroTaskPartitioner::partitionT
std::list< std::pair< Batch, double > > partitionT
Definition: macrotaskpartitioner.h:194

madness::Nemo
The Nemo class.
Definition: nemo.h:326

madness::SCFOperatorBase::vecfuncT
std::vector< functionT > vecfuncT
Definition: SCFOperators.h:62

madness::SCFOperatorBase::taskq
std::shared_ptr< MacroTaskQ > taskq
Definition: SCFOperators.h:70

madness::SCF
Definition: SCF.h:187

madness::WorldGopInterface::sum
void sum(T *buf, size_t nelem)
Inplace global sum while still processing AM & tasks.
Definition: worldgop.h:870

madness::World
A parallel world class.
Definition: world.h:132

madness::World::rank
ProcessID rank() const
Returns the process rank in this World (same as MPI_Comm_rank()).
Definition: world.h:318

madness::World::gop
WorldGopInterface & gop
Global operations.
Definition: world.h:205

cloud.h
Declares the Cloud class for storing data and transferring them between worlds.

lo
static double lo
Definition: dirac-hatom.cc:23

T
auto T(World &world, response_space &f) -> response_space
Definition: global_functions.cc:34

macrotaskq.h
Declares the macrotaskq and MacroTaskBase classes.

madness.h
General header file for using MADNESS.

MADNESS_CHECK
#define MADNESS_CHECK(condition)
Check a condition — even in a release build the condition is always evaluated so it can have side eff...
Definition: madness_exception.h:190

madness
File holds all helper structures necessary for the CC_Operator and CC2 class.
Definition: DFParameters.h:10

madness::copy
Function< T, NDIM > copy(const Function< T, NDIM > &f, const std::shared_ptr< WorldDCPmapInterface< Key< NDIM > > > &pmap, bool fence=true)
Create a new copy of the function with different distribution and optional fence.
Definition: mra.h:2002

madness::_
static const Slice _(0,-1, 1)

madness::CoulombOperatorPtr
static SeparatedConvolution< double, 3 > * CoulombOperatorPtr(World &world, double lo, double eps, const BoundaryConditions< 3 > &bc=FunctionDefaults< 3 >::get_bc(), int k=FunctionDefaults< 3 >::get_k())
Factory function generating separated kernel for convolution with 1/r in 3D.
Definition: operator.h:1762

thresh
static const double thresh
Definition: rk.cc:45

NDIM
static const std::size_t NDIM
Definition: testpdiff.cc:42