madness/api-doc/vmra1_8h_source.html

/*

  This file is part of MADNESS.


  Copyright (C) 2007,2010 Oak Ridge National Laboratory


  This program is free software; you can redistribute it and/or modify

  it under the terms of the GNU General Public License as published by

  the Free Software Foundation; either version 2 of the License, or

  (at your option) any later version.


  This program is distributed in the hope that it will be useful,

  but WITHOUT ANY WARRANTY; without even the implied warranty of

  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

  GNU General Public License for more details.


  You should have received a copy of the GNU General Public License

  along with this program; if not, write to the Free Software

  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA


  For more information please contact:


  Robert J. Harrison

  Oak Ridge National Laboratory

  One Bethel Valley Road

  P.O. Box 2008, MS-6367


  email: harrisonrj@ornl.gov

  tel:   865-241-3937

  fax:   865-572-0680


  $Id$

*/


#ifndef MADNESS_MRA_VMRA_H__INCLUDED

#define MADNESS_MRA_VMRA_H__INCLUDED


/*!

    \file vmra.h

    \brief Defines operations on vectors of Functions

    \ingroup mra


    This file defines a number of operations on vectors of functions.

    Assume v is a vector of NDIM-D functions of a certain type.


    Operations on array of functions


    *) copying: deep copying of vectors of functions to vector of functions

    \code

    vector2 = copy(world, vector1,fence);

    \endcode


    *) compress: convert multiwavelet representation to legendre representation

    \code

    compress(world, vector, fence);

    \endcode


    *) reconstruct: convert representation to multiwavelets

    \code

    reconstruct(world, vector, fence);

    \endcode


    *) make_nonstandard: convert to non-standard form

    \code

    make_nonstandard(world, v, fence);

    \endcode


    *) standard: convert to standard form

    \code

    standard(world, v, fence);

    \endcode


    *) truncate: truncating vectors of functions to desired precision

    \code

    truncate(world, v, tolerance, fence);

    \endcode


    *) zero function: create a vector of zero functions of length n

    \code

    v=zero(world, n);

    \endcode


    *) transform: transform a representation from one basis to another

    \code

    transform(world, vector, tensor, tolerance, fence )

    \endcode


    Setting thresh-hold for precision


    *) set_thresh: setting a finite thresh-hold for a vector of functions

    \code

    void set_thresh(World& world, std::vector< Function<T,NDIM> >& v, double thresh, bool fence=true);

    \endcode


    Arithmetic Operations on arrays of functions


    *) conjugation: conjugate a vector of complex functions


    *) add

    *) sub

    *) mul

       - mul_sparse

    *) square

    *) gaxpy

    *) apply


    Norms, inner-products, blas-1 like operations on vectors of functions


    *) inner

    *) matrix_inner

    *) norm_tree

    *) normalize

    *) norm2

        - norm2s

    *) scale(world, v, alpha);


*/


#include <madness/mra/mra.h>

#include <madness/mra/derivative.h>

#include <cstdio>


namespace madness {


    /// Compress a vector of functions

    template <typename T, std::size_t NDIM>


    void compress(World& world,

                  const std::vector< Function<T,NDIM> >& v,

          unsigned int blk=1,

                  bool fence=true){


        PROFILE_BLOCK(Vcompress);

        bool must_fence = false;

    unsigned int vvsize = v.size();

        for (unsigned int i=0; i<vvsize; i+= blk) {

      for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j) {

            if (!v[j].is_compressed()) {

          v[j].compress(false);

          must_fence = true;

            }

      }

      if ( blk!=1 && must_fence && fence) world.gop.fence();

    }


        if (fence && must_fence) world.gop.fence();

    }


    /// Reconstruct a vector of functions

    template <typename T, std::size_t NDIM>


    void reconstruct(World& world,

                     const std::vector< Function<T,NDIM> >& v,

             unsigned int blk=1,

                     bool fence=true){ // reconstr

    PROFILE_BLOCK(Vreconstruct);

    bool must_fence = false;

    unsigned int vvsize = v.size();

    for (unsigned int i=0; i<vvsize; i+= blk) {

      for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j) {

        if (v[j].is_compressed()) {

          v[j].reconstruct(false);

          must_fence = true;

        }

      }

      if ( blk!=1 && must_fence && fence) world.gop.fence();

    }


    if (fence && must_fence) world.gop.fence();

    } // reconstr


    /// Generates non-standard form of a vector of functions

    template <typename T, std::size_t NDIM>


      void nonstandard(World& world,

               std::vector< Function<T,NDIM> >& v,

               unsigned int blk=1,

               bool fence=true) { // nonstand

        PROFILE_BLOCK(Vnonstandard);

    unsigned int vvsize = v.size();

        reconstruct(world, v, blk);

    for (unsigned int i=0; i<vvsize; i+= blk) {

      for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j) {

          v[j].make_nonstandard(false, false);

      }

      if ( blk!=1 && fence) world.gop.fence();

    }

    if (fence) world.gop.fence();

    } //nonstand


    /// Generates standard form of a vector of functions


    template <typename T, std::size_t NDIM>


      void standard(World& world,

            std::vector< Function<T,NDIM> >& v,

            unsigned int blk=1,

            bool fence=true){ // standard

    PROFILE_BLOCK(Vstandard);

    unsigned int vvsize = v.size();

    for (unsigned int i=0; i<vvsize; i+= blk) {

      for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j) {

        v[j].standard(false);

      }

      if ( blk!=1 && fence) world.gop.fence();

    }

    if (fence) world.gop.fence();

    } // standard


    /// Truncates a vector of functions

    template <typename T, std::size_t NDIM>


    void truncate(World& world,

                  std::vector< Function<T,NDIM> >& v,

                  double tol=0.0,

          unsigned int blk=1,

                  bool fence=true){ // truncate

    PROFILE_BLOCK(Vtruncate);


    compress(world, v, blk);


    unsigned int vvsize = v.size();

    for (unsigned int i=0; i<vvsize; i+= blk) {

      for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j) {

        v[j].truncate(tol, false);

      }

      if ( blk!=1 && fence) world.gop.fence();

    }

        if (fence) world.gop.fence();

    } //truncate


    /// Applies a derivative operator to a vector of functions


    template <typename T, std::size_t NDIM>

      std::vector< Function<T,NDIM> >


      apply(World& world,

         const Derivative<T,NDIM>& D,

         const std::vector< Function<T,NDIM> >& v,

         const unsigned int blk=1,

         const bool fence=true)

      {

    reconstruct(world, v, blk);

    std::vector< Function<T,NDIM> > df(v.size());


    unsigned int vvsize = v.size();


    for (unsigned int i=0; i<vvsize; i+= blk) {

      for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j) {

        df[j] = D(v[j],false);

      }

      if (blk!= 1 && fence) world.gop.fence();

    }

    if (fence) world.gop.fence();


    return df;

      }


    /// Generates a vector of zero functions


    template <typename T, std::size_t NDIM>

      std::vector< Function<T,NDIM> >


      zero_functions(World& world, int n) {

      PROFILE_BLOCK(Vzero_functions);

      std::vector< Function<T,NDIM> > r(n);

      for (int i=0; i<n; ++i)

    r[i] = Function<T,NDIM>(FunctionFactory<T,NDIM>(world));


      return r;

    }


    /// Transforms a vector of functions according to new[i] = sum[j] old[j]*c[j,i]


    /// Uses sparsity in the transformation matrix --- set small elements to

    /// zero to take advantage of this.


    template <typename T, typename R, std::size_t NDIM>

      std::vector< Function<TENSOR_RESULT_TYPE(T,R),NDIM> >


      transform(World& world,

        const std::vector< Function<T,NDIM> >& v,

        const Tensor<R>& c,

        unsigned int blki=1,

        unsigned int blkj=1,

        const bool fence=true){


      PROFILE_BLOCK(Vtransformsp);


      typedef TENSOR_RESULT_TYPE(T,R) resultT;


      unsigned int blk = min(blki, blkj);

      unsigned int n = v.size();  // n is the old dimension

      unsigned int m = c.dim(1);  // m is the new dimension

      MADNESS_ASSERT(n==c.dim(0));


      std::vector< Function<resultT,NDIM> > vc = zero_functions_compressed<resultT,NDIM>(world, m);

      compress(world, v, blk);


      for (unsigned int i=0; i<m; i+= blki) {

    for (unsigned int ii=i; ii<std::min(m,(i+1)*blki); ii++) {

      for (unsigned int j=0; j<n; j+= blkj) {

        for (unsigned int jj=j; jj<std::min(n, (j+1)*blkj); jj++)

          if (c(jj,ii) != R(0.0)) vc[ii].gaxpy(1.0,v[jj],c(jj,ii),false);

        if (fence && (blkj!=1)) world.gop.fence();

      }

    }

    if (fence && (blki!=1)) world.gop.fence();  // a bit conservative

      }


      //      for (unsigned int i=0; i<m; ++i) {

      // for (unsigned int j=0; j<n; ++j) {

      // if (c(j,i) != R(0.0)) vc[i].gaxpy(1.0,v[j],c(j,i),false);

      // }

      // }


      if (fence) world.gop.fence();

      return vc;

    }


    template <typename L, typename R, std::size_t NDIM>

      std::vector< Function<TENSOR_RESULT_TYPE(L,R),NDIM> >


      transform(World& world,

        const std::vector< Function<L,NDIM> >& v,

        const Tensor<R>& c,

        const double tol,

        const unsigned int blki=1,

        const bool fence)

      {

        PROFILE_BLOCK(Vtransform);

        MADNESS_ASSERT(v.size() == (unsigned int)(c.dim(0)));


        std::vector< Function<TENSOR_RESULT_TYPE(L,R),NDIM> > vresult(c.dim(1));

    unsigned int m=c.dim(1);


    for (unsigned int i=0; i<m; i+= blki) {

      for (unsigned int ii=i; ii<std::min(m,(i+1)*blki); ii++) {

        vresult[ii] = Function<TENSOR_RESULT_TYPE(L,R),NDIM>(FunctionFactory<TENSOR_RESULT_TYPE(L,R),NDIM>(world));

      }

      if (fence && (blki!=1)) world.gop.fence();  // a bit conservative

    }


    //        for (unsigned int i=0; i<c.dim(1); ++i) {

    // vresult[i] = Function<TENSOR_RESULT_TYPE(L,R),NDIM>(FunctionFactory<TENSOR_RESULT_TYPE(L,R),NDIM>(world));

    // }

        compress(world, v, blki, false);

        compress(world, vresult, blki, false);

        world.gop.fence();

        vresult[0].vtransform(v, c, vresult, tol, fence);

        return vresult;

      }


    /// Scales inplace a vector of functions by distinct values


    template <typename T, typename Q, std::size_t NDIM>


      void scale(World& world,

         std::vector< Function<T,NDIM> >& v,

         const std::vector<Q>& factors,

         const unsigned int blk=1,

         const bool fence=true)

      {

    PROFILE_BLOCK(Vscale);


    unsigned int vvsize = v.size();

    for (unsigned int i=0; i<vvsize; i+= blk) {

      for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j) {

        v[j].scale(factors[j],false);

      }

      if (fence && blk!=1 ) world.gop.fence();

    }

    if (fence) world.gop.fence();

      }


    /// Scales inplace a vector of functions by the same


    template <typename T, typename Q, std::size_t NDIM>


      void scale(World& world,

         std::vector< Function<T,NDIM> >& v,

          const Q factor,

         const unsigned int blk=1,

         const bool fence=true){


    PROFILE_BLOCK(Vscale); // shouldn't need blocking since it is local


    unsigned int vvsize = v.size();

    for (unsigned int i=0; i<vvsize; i+= blk) {

      for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j) {

        v[j].scale(factor,false);

      }

      if (fence && blk!=1 ) world.gop.fence();

    }

    if (fence) world.gop.fence();

      }


    /// Computes the 2-norms of a vector of functions

    template <typename T, std::size_t NDIM>


      std::vector<double> norm2s(World& world,

                 const std::vector< Function<T,NDIM> >& v,

                 const unsigned int blk=1,

                 const bool fence=true){


      PROFILE_BLOCK(Vnorm2);

      unsigned int vvsize = v.size();

      std::vector<double> norms(vvsize);


      for (unsigned int i=0; i<vvsize; i+= blk) {

    for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j) {

      norms[j] = v[j].norm2sq_local();

    }

    if (fence && (blk!=1)) world.gop.fence();

      }

      if (fence ) world.gop.fence();


      world.gop.sum(&norms[0], norms.size());


      for (unsigned int i=0; i<vvsize; i+= blk) {

    for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j)

      norms[j] = sqrt(norms[j]);

    if (fence && (blk!=1)) world.gop.fence();

      }


      world.gop.fence();

      return norms;

    }


    /// Computes the 2-norm of a vector of functions

    // should be local; norms[0] contains the result


    template <typename T, std::size_t NDIM>

      double norm2(World& world,

           const std::vector< Function<T,NDIM> >& v)

      {


    PROFILE_BLOCK(Vnorm2);


    std::vector<double> norms(v.size());


    for (unsigned int i=0; i<v.size(); ++i)

      norms[i] = v[i].norm2sq_local();


    world.gop.sum(&norms[0], norms.size());


    for (unsigned int i=1; i<v.size(); ++i)

      norms[0] += norms[i];


    world.gop.fence();

    return sqrt(norms[0]);

      }


    inline double conj(double x) {

      return x;

    }


    inline double conj(float x) {

      return x;

    }


    template <typename T, typename R, std::size_t NDIM>


    struct MatrixInnerTask : public TaskInterface {

        Tensor<TENSOR_RESULT_TYPE(T,R)> result; // Must be a copy

        const Function<T,NDIM>& f;

        const std::vector< Function<R,NDIM> >& g;

        long jtop;


        MatrixInnerTask(const Tensor<TENSOR_RESULT_TYPE(T,R)>& result,

                const Function<T,NDIM>& f,

                const std::vector< Function<R,NDIM> >& g,

                long jtop)

        : result(result), f(f), g(g), jtop(jtop) {}


        void run(World& world) {

            for (long j=0; j<jtop; ++j) {

                result(j) = f.inner_local(g[j]);

            }

        }


    private:

        /// Get the task id


        /// \param id The id to set for this task


        virtual void get_id(std::pair<void*,unsigned short>& id) const {

            PoolTaskInterface::make_id(id, *this);

        }


    }; // struct MatrixInnerTask


    /// Computes the matrix inner product of two function vectors - q(i,j) = inner(f[i],g[j])


    /// For complex types symmetric is interpreted as Hermitian.

    ///

    /// The current parallel loop is non-optimal but functional.


    template <typename T, typename R, std::size_t NDIM>

      Tensor< TENSOR_RESULT_TYPE(T,R) > matrix_inner(World& world,

                             const std::vector< Function<T,NDIM> >& f,

                             const std::vector< Function<R,NDIM> >& g,

                             bool sym=false) {

      PROFILE_BLOCK(Vmatrix_inner);

      unsigned int n=f.size(), m=g.size();

      Tensor< TENSOR_RESULT_TYPE(T,R) > r(n,m);

      if (sym) MADNESS_ASSERT(n==m);


      world.gop.fence();

      compress(world, f);

      if (&f != &g) compress(world, g);


      //         for (long i=0; i<n; ++i) {

      //             long jtop = m;

      //             if (sym) jtop = i+1;

      //             for (long j=0; j<jtop; ++j) {

      //                 r(i,j) = f[i].inner_local(g[j]);

      //                 if (sym) r(j,i) = conj(r(i,j));

      //             }

      //         }


      for (unsigned int i=n-1; i>=0; --i) {

    unsigned int jtop = m;

    if (sym) jtop = i+1;

    world.taskq.add(new MatrixInnerTask<T,R,NDIM>(r(i,_), f[i], g, jtop));

      }

      world.gop.fence();

      world.gop.sum(r.ptr(),n*m);


      if (sym) {

    for (unsigned int i=0; i<n; ++i) {

      for (unsigned int j=0; j<i; ++j) {

        r(j,i) = conj(r(i,j));

      }

    }

      }

      return r;

    }


    /// Computes the element-wise inner product of two function vectors - q(i) = inner(f[i],g[i])


    template <typename T, typename R, std::size_t NDIM>

      Tensor< TENSOR_RESULT_TYPE(T,R) > inner(World& world,

                          const std::vector< Function<T,NDIM> >& f,

                          const std::vector< Function<R,NDIM> >& g) {

      PROFILE_BLOCK(Vinnervv);

      long n=f.size(), m=g.size();

      MADNESS_ASSERT(n==m);

      Tensor< TENSOR_RESULT_TYPE(T,R) > r(n);


      compress(world, f);

      compress(world, g);


      for (long i=0; i<n; ++i) {

    r(i) = f[i].inner_local(g[i]);

      }


      world.taskq.fence();

      world.gop.sum(r.ptr(),n);

      world.gop.fence();

      return r;

    }


    /// Computes the inner product of a function with a function vector - q(i) = inner(f,g[i])


    template <typename T, typename R, std::size_t NDIM>

      Tensor< TENSOR_RESULT_TYPE(T,R) > inner(World& world,

                          const Function<T,NDIM>& f,

                          const std::vector< Function<R,NDIM> >& g) {

      PROFILE_BLOCK(Vinner);

      long n=g.size();

      Tensor< TENSOR_RESULT_TYPE(T,R) > r(n);


      f.compress();

      compress(world, g);


      for (long i=0; i<n; ++i) {

    r(i) = f.inner_local(g[i]);

      }


      world.taskq.fence();

      world.gop.sum(r.ptr(),n);

      world.gop.fence();

      return r;

    }


    /// Multiplies a function against a vector of functions --- q[i] = a * v[i]


    template <typename T, typename R, std::size_t NDIM>

      std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >


      mul(World& world,

      const Function<T,NDIM>& a,

      const std::vector< Function<R,NDIM> >& v,

      const unsigned int blk=1,

      const bool fence=true) {


      PROFILE_BLOCK(Vmul);

      a.reconstruct(false);

      reconstruct(world, v, blk, false);

      world.gop.fence();

      return vmulXX(a, v, 0.0, fence);

    }


    /// Multiplies a function against a vector of functions using sparsity of a and v[i] --- q[i] = a * v[i]

    template <typename T, typename R, std::size_t NDIM>

      std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >


      mul_sparse(World& world,

         const Function<T,NDIM>& a,

         const std::vector< Function<R,NDIM> >& v,

         const double tol,

         const bool fence=true,

         const unsigned int blk=1)

 {

      PROFILE_BLOCK(Vmulsp);

      a.reconstruct(false);

      reconstruct(world, v, blk, false);

      world.gop.fence();


      unsigned int vvsize = v.size();

      for (unsigned int i=0; i<vvsize; i+= blk) {

    for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j)

      v[j].norm_tree(false);

    if ( fence && (blk == 1)) world.gop.fence();

      }

      a.norm_tree();

      return vmulXX(a, v, tol, fence);

    }


    /// Makes the norm tree for all functions in a vector

    template <typename T, std::size_t NDIM>


      void norm_tree(World& world,

             const std::vector< Function<T,NDIM> >& v,

             bool fence=true,

             unsigned int blk=1){

        PROFILE_BLOCK(Vnorm_tree);


      unsigned int vvsize = v.size();

      for (unsigned int i=0; i<vvsize; i+= blk) {

    for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j)

      v[j].norm_tree(false);

        if (fence && blk!=1 ) world.gop.fence();

      }

      if (fence) world.gop.fence();

    }


    /// Multiplies two vectors of functions q[i] = a[i] * b[i]


    template <typename T, typename R, std::size_t NDIM>

      std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >


      mul(World& world,

      const std::vector< Function<T,NDIM> >& a,

      const std::vector< Function<R,NDIM> >& b,

      bool fence=true,

      unsigned int blk=1){

      PROFILE_BLOCK(Vmulvv);

      reconstruct(world, a, blk, false);

      if (&a != &b) reconstruct(world, b, blk, false);

      world.gop.fence();


      std::vector< Function<TENSOR_RESULT_TYPE(T,R),NDIM> > q(a.size());


      unsigned int vvsize = a.size();

      for (unsigned int i=0; i<vvsize; i+= blk) {

    for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j)

      q[j] = mul(a[j], b[j], false);

    if (fence && (blk !=1 )) world.gop.fence();

      }

      if (fence) world.gop.fence();

      return q;

    }


    /// Computes the square of a vector of functions --- q[i] = v[i]**2


    template <typename T, std::size_t NDIM>

      std::vector< Function<T,NDIM> >

      square(World& world,

         const std::vector< Function<T,NDIM> >& v,

         bool fence=true) {

      return mul<T,T,NDIM>(world, v, v, fence);

      //         std::vector< Function<T,NDIM> > vsq(v.size());

      //         for (unsigned int i=0; i<v.size(); ++i) {

      //             vsq[i] = square(v[i], false);

      //         }

      //         if (fence) world.gop.fence();

      //         return vsq;

    }


    /// Sets the threshold in a vector of functions


    template <typename T, std::size_t NDIM>

      void set_thresh(World& world,

              std::vector< Function<T,NDIM> >& v,

              double thresh,

              bool fence=true) {

      for (unsigned int j=0; j<v.size(); ++j) {

    v[j].set_thresh(thresh,false);

      }

      if (fence) world.gop.fence();

    }


    /// Returns the complex conjugate of the vector of functions


    template <typename T, std::size_t NDIM>

      std::vector< Function<T,NDIM> >

      conj(World& world,

       const std::vector< Function<T,NDIM> >& v,

       bool fence=true){

      PROFILE_BLOCK(Vconj);

      std::vector< Function<T,NDIM> > r = copy(world, v); // Currently don't have oop conj

      for (unsigned int i=0; i<v.size(); ++i) {

    r[i].conj(false);

      }

      if (fence) world.gop.fence();

      return r;

    }


    /// Returns a deep copy of a vector of functions


    template <typename T, std::size_t NDIM>

      std::vector< Function<T,NDIM> >

      copy(World& world,

       const std::vector< Function<T,NDIM> >& v,

       bool fence=true) {

      PROFILE_BLOCK(Vcopy);

      std::vector< Function<T,NDIM> > r(v.size());

      for (unsigned int i=0; i<v.size(); ++i) {

    r[i] = copy(v[i], false);

      }

      if (fence) world.gop.fence();

      return r;

    }


    /// Returns a vector of deep copies of of a function


    template <typename T, std::size_t NDIM>

      std::vector< Function<T,NDIM> >

      copy(World& world,

       const Function<T,NDIM>& v,

       const unsigned int n,

       bool fence=true) {

      PROFILE_BLOCK(Vcopy1);

      std::vector< Function<T,NDIM> > r(n);

      for (unsigned int i=0; i<n; ++i) {

    r[i] = copy(v, false);

      }

      if (fence) world.gop.fence();

      return r;

    }


    /// Returns new vector of functions --- q[i] = a[i] + b[i]


    template <typename T, typename R, std::size_t NDIM>

      std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >


      add(World& world,

      const std::vector< Function<T,NDIM> >& a,

      const std::vector< Function<R,NDIM> >& b,

      bool fence=true,

      unsigned int blk=1) {

      PROFILE_BLOCK(Vadd);

      MADNESS_ASSERT(a.size() == b.size());

      compress(world, a, blk);

      compress(world, b, blk);


      std::vector< Function<TENSOR_RESULT_TYPE(T,R),NDIM> > r(a.size());


      unsigned int vvsize = a.size();

      for (unsigned int i=0; i<vvsize; i+= blk) {

    for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j)

      r[j] = add(a[j], b[j], false);

    if (fence && (blk !=1 )) world.gop.fence();

      }

      if (fence) world.gop.fence();


      return r;

    }


     /// Returns new vector of functions --- q[i] = a + b[i]


    template <typename T, typename R, std::size_t NDIM>

      std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >


      add(World& world,

      const Function<T,NDIM> & a,

      const std::vector< Function<R,NDIM> >& b,

       bool fence=true,

      unsigned int blk=1) {


      PROFILE_BLOCK(Vadd1);

      a.compress();

      compress(world, b, blk);


      std::vector< Function<TENSOR_RESULT_TYPE(T,R),NDIM> > r(b.size());


      unsigned int vvsize = b.size();

      for (unsigned int i=0; i<vvsize; i+= blk) {

    for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j)

      r[j] = add(a, b[j], false);

    if (fence && (blk !=1 )) world.gop.fence();

      }

      if (fence) world.gop.fence();


      return r;

    }


    template <typename T, typename R, std::size_t NDIM>

      inline std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >


      add(World& world,

      const std::vector< Function<R,NDIM> >& b,

      const Function<T,NDIM> & a,

       bool fence=true,

      unsigned int blk=1) {

      return add(world, a, b, fence, blk);

    }


    /// Returns new vector of functions --- q[i] = a[i] - b[i]


    template <typename T, typename R, std::size_t NDIM>

      std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >


      sub(World& world,

       const std::vector< Function<T,NDIM> >& a,

       const std::vector< Function<R,NDIM> >& b,

       bool fence=true,

       unsigned int blk=1) {

      PROFILE_BLOCK(Vsub);

      MADNESS_ASSERT(a.size() == b.size());

      compress(world, a, fence, blk);

      compress(world, b, fence, blk);


      std::vector< Function<TENSOR_RESULT_TYPE(T,R),NDIM> > r(a.size());


      unsigned int vvsize = a.size();

      for (unsigned int i=0; i<vvsize; i+= blk) {

    for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j)

      r[j] = sub(a[j], b[j], false);

    if (fence && (blk !=1 )) world.gop.fence();

      }

      if (fence) world.gop.fence();

      return r;

    }


    /// Generalized A*X+Y for vectors of functions ---- a[i] = alpha*a[i] + beta*b[i]


    template <typename T, typename Q, typename R, std::size_t NDIM>


      void gaxpy(World& world,

         Q alpha,

         std::vector< Function<T,NDIM> >& a,

         Q beta,

         const std::vector< Function<R,NDIM> >& b,

         unsigned int blk=1,

         bool fence=true) {

      PROFILE_BLOCK(Vgaxpy);

      MADNESS_ASSERT(a.size() == b.size());

      compress(world, a, fence, blk);

      compress(world, b, fence, blk);


      unsigned int vvsize = a.size();


      for (unsigned int i=0; i<vvsize; i+= blk) {

    for (unsigned int j=i; j<std::min(vvsize,(i+1)*blk); ++j)

      a[j].gaxpy(alpha, b[j], beta, false);


    if (fence && (blk !=1 )) world.gop.fence();


      }

      //      for (unsigned int i=0; i<a.size(); ++i) {

      //    a[i].gaxpy(alpha, b[i], beta, false);

      // }

      if (fence) world.gop.fence();

    }


    /// Applies a vector of operators to a vector of functions --- q[i] = apply(op[i],f[i])


    template <typename opT, typename R, std::size_t NDIM>

      std::vector< Function<TENSOR_RESULT_TYPE(typename opT::opT,R), NDIM> >


      apply(World& world,

        const std::vector< std::shared_ptr<opT> >& op,

        const std::vector< Function<R,NDIM> > f,

        const unsigned int blk=1){


      PROFILE_BLOCK(Vapplyv);

      MADNESS_ASSERT(f.size()==op.size());


      std::vector< Function<R,NDIM> >& ncf = *const_cast< std::vector< Function<R,NDIM> >* >(&f);


      reconstruct(world, f, blk);

      nonstandard(world, ncf, blk);


      std::vector< Function<TENSOR_RESULT_TYPE(typename opT::opT,R), NDIM> > result(f.size());

      unsigned int ff = f.size();


      for (unsigned int i=0; i<ff; ++blk) {

    for (unsigned int j=i; j<std::min(ff,(i+1)*blk); ++j)

      result[j] = apply_only(*op[j], f[j], false);

    if (blk !=1)

      world.gop.fence();

      }


      world.gop.fence();


      standard(world, ncf, false);  // restores promise of logical constness

      world.gop.fence();

      reconstruct(world, result, blk);


      return result;

    }


    /// Applies an operator to a vector of functions --- q[i] = apply(op,f[i])


    template <typename T, typename R, std::size_t NDIM>

      std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >


      apply(World& world,

        const SeparatedConvolution<T,NDIM>& op,

        const std::vector< Function<R,NDIM> > f,

        const unsigned int blk=1) {

      PROFILE_BLOCK(Vapply);


      std::vector< Function<R,NDIM> >& ncf = *const_cast< std::vector< Function<R,NDIM> >* >(&f);


      reconstruct(world, f, blk);

      nonstandard(world, ncf, blk);


      std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> > result(f.size());


      unsigned int ff = f.size();

      for (unsigned int i=0; i<ff; ++blk) {

    for (unsigned int j=i; j<std::min(ff,(i+1)*blk); ++j)

      result[j] = apply_only(op, f[j], false);

    if (blk !=1)

      world.gop.fence();

      }

      world.gop.fence();


      standard(world, ncf, blk, false);  // restores promise of logical constness

      world.gop.fence();

      reconstruct(world, result, blk);


      return result;

    }


    /// Normalizes a vector of functions --- v[i] = v[i].scale(1.0/v[i].norm2())


    template <typename T, std::size_t NDIM>

      void normalize(World& world,

             std::vector< Function<T,NDIM> >& v,

             bool fence=true){


      PROFILE_BLOCK(Vnormalize);

      std::vector<double> nn = norm2s(world, v);


      for (unsigned int i=0; i<v.size(); ++i)

    v[i].scale(1.0/nn[i],false);


      if (fence) world.gop.fence();

    }


}

#endif // MADNESS_MRA_VMRA_H__INCLUDED

q
double q(double t)
Definition DKops.h:18

madness::BaseTensor::size
long size() const
Returns the number of elements in the tensor.
Definition basetensor.h:138

madness::Derivative
Implements derivatives operators with variety of boundary conditions on simulation domain.
Definition derivative.h:266

madness::FunctionFactory
FunctionFactory implements the named-parameter idiom for Function.
Definition function_factory.h:86

madness::Function
A multiresolution adaptive numerical function.
Definition mra.h:139

madness::PoolTaskInterface::make_id
static std::enable_if< detail::function_traits< fnT >::value||detail::memfunc_traits< fnT >::value >::type make_id(std::pair< void *, unsigned short > &id, fnT fn)
Definition thread.h:922

madness::SeparatedConvolution
Convolutions in separated form (including Gaussian)
Definition operator.h:139

madness::TaskInterface
All world tasks must be derived from this public interface.
Definition taskfn.h:69

madness::TaskInterface::world
volatile World * world
Definition taskfn.h:72

madness::Tensor
A tensor is a multidimensional array.
Definition tensor.h:317

madness::WorldGopInterface::fence
void fence(bool debug=false)
Synchronizes all processes in communicator AND globally ensures no pending AM or tasks.
Definition worldgop.cc:161

madness::WorldGopInterface::sum
void sum(T *buf, size_t nelem)
Inplace global sum while still processing AM & tasks.
Definition worldgop.h:872

madness::World
A parallel world class.
Definition world.h:132

madness::World::gop
WorldGopInterface & gop
Global operations.
Definition world.h:207

R
static const double R
Definition csqrt.cc:46

derivative.h
Declaration and initialization of tree traversal functions and generic derivative.

T
auto T(World &world, response_space &f) -> response_space
Definition global_functions.cc:34

beta
const double beta
Definition gygi_soltion.cc:62

v
static const double v
Definition hatom_sf_dirac.cc:20

op
Tensor< double > op(const Tensor< double > &x)
Definition kain.cc:508

MADNESS_ASSERT
#define MADNESS_ASSERT(condition)
Assert a condition that should be free of side-effects since in release builds this might be a no-op.
Definition madness_exception.h:134

mra.h
Main include file for MADNESS and defines Function interface.

madness
Namespace for all elements and tools of MADNESS.
Definition DFParameters.h:10

madness::square
Function< T, NDIM > square(const Function< T, NDIM > &f, bool fence=true)
Create a new function that is the square of f - global comm only if not reconstructed.
Definition mra.h:2746

madness::scale
response_space scale(response_space a, double b)

madness::sub
Function< TENSOR_RESULT_TYPE(L, R), NDIM > sub(const Function< L, NDIM > &left, const Function< R, NDIM > &right, bool fence=true)
Same as operator- but with optional fence and no automatic compression.
Definition mra.h:2035

madness::norm2s
std::vector< double > norm2s(World &world, const std::vector< Function< T, NDIM > > &v)
Computes the 2-norms of a vector of functions.
Definition vmra.h:845

madness::mul
Function< TENSOR_RESULT_TYPE(Q, T), NDIM > mul(const Q alpha, const Function< T, NDIM > &f, bool fence=true)
Returns new function equal to alpha*f(x) with optional fence.
Definition mra.h:1765

madness::truncate
void truncate(World &world, response_space &v, double tol, bool fence)
Definition basic_operators.cc:30

madness::norm_tree
void norm_tree(World &world, const std::vector< Function< T, NDIM > > &v, bool fence=true)
Makes the norm tree for all functions in a vector.
Definition vmra.h:1181

madness::transform
std::vector< Function< TENSOR_RESULT_TYPE(T, R), NDIM > > transform(World &world, const std::vector< Function< T, NDIM > > &v, const Tensor< R > &c, bool fence=true)
Transforms a vector of functions according to new[i] = sum[j] old[j]*c[j,i].
Definition vmra.h:707

madness::nonstandard
@ nonstandard
s and d coeffs in internal nodes
Definition funcdefaults.h:62

madness::conj
Function< T, NDIM > conj(const Function< T, NDIM > &f, bool fence=true)
Return the complex conjugate of the input function with the same distribution and optional fence.
Definition mra.h:2110

madness::standard
void standard(World &world, std::vector< Function< T, NDIM > > &v, bool fence=true)
Generates standard form of a vector of functions.
Definition vmra.h:243

madness::compress
void compress(World &world, const std::vector< Function< T, NDIM > > &v, bool fence=true)
Compress a vector of functions.
Definition vmra.h:149

madness::reconstruct
const std::vector< Function< T, NDIM > > & reconstruct(const std::vector< Function< T, NDIM > > &v)
reconstruct a vector of functions
Definition vmra.h:162

madness::set_thresh
void set_thresh(World &world, std::vector< Function< T, NDIM > > &v, double thresh, bool fence=true)
Sets the threshold in a vector of functions.
Definition vmra.h:1285

madness::norm2
double norm2(World &world, const std::vector< Function< T, NDIM > > &v)
Computes the 2-norm of a vector of functions.
Definition vmra.h:871

madness::_
static const Slice _(0,-1, 1)

madness::mul_sparse
Function< TENSOR_RESULT_TYPE(L, R), NDIM > mul_sparse(const Function< L, NDIM > &left, const Function< R, NDIM > &right, double tol, bool fence=true)
Sparse multiplication — left and right must be reconstructed and if tol!=0 have tree of norms already...
Definition mra.h:1806

madness::apply
response_space apply(World &world, std::vector< std::vector< std::shared_ptr< real_convolution_3d > > > &op, response_space &f)
Definition basic_operators.cc:39

madness::f
NDIM & f
Definition mra.h:2481

madness::add
Function< TENSOR_RESULT_TYPE(L, R), NDIM > add(const Function< L, NDIM > &left, const Function< R, NDIM > &right, bool fence=true)
Same as operator+ but with optional fence and no automatic compression.
Definition mra.h:1991

madness::g
NDIM const Function< R, NDIM > & g
Definition mra.h:2481

madness::apply_only
Function< TENSOR_RESULT_TYPE(typename opT::opT, R), NDIM > apply_only(const opT &op, const Function< R, NDIM > &f, bool fence=true)
Apply operator ONLY in non-standard form - required other steps missing !!
Definition mra.h:2184

madness::inner
double inner(response_space &a, response_space &b)
Definition response_functions.h:442

madness::vmulXX
std::vector< Function< TENSOR_RESULT_TYPE(L, R), D > > vmulXX(const Function< L, D > &left, const std::vector< Function< R, D > > &vright, double tol, bool fence=true)
Use the vmra/mul(...) interface instead.
Definition mra.h:1871

madness::normalize
void normalize(World &world, std::vector< Function< T, NDIM > > &v, bool fence=true)
Normalizes a vector of functions — v[i] = v[i].scale(1.0/v[i].norm2())
Definition vmra.h:1810

madness::zero_functions
std::vector< Function< T, NDIM > > zero_functions(World &world, int n, bool fence=true)
Generates a vector of zero functions (reconstructed)
Definition vmra.h:416

madness::matrix_inner
void matrix_inner(DistributedMatrix< T > &A, const std::vector< Function< T, NDIM > > &f, const std::vector< Function< T, NDIM > > &g, bool sym=false)
Definition distpm.cc:46

madness::copy
Function< T, NDIM > copy(const Function< T, NDIM > &f, const std::shared_ptr< WorldDCPmapInterface< Key< NDIM > > > &pmap, bool fence=true)
Create a new copy of the function with different distribution and optional fence.
Definition mra.h:2066

madness::gaxpy
void gaxpy(const double a, ScalarResult< T > &left, const double b, const T &right, const bool fence=true)
the result type of a macrotask must implement gaxpy
Definition macrotaskq.h:245

b
static const double b
Definition nonlinschro.cc:119

a
static const double a
Definition nonlinschro.cc:118

Q
double Q(double a)
Definition relops.cc:20

c
static const double c
Definition relops.cc:10

m
static const double m
Definition relops.cc:9

L
static const double L
Definition rk.cc:46

thresh
static const double thresh
Definition rk.cc:45

D
Definition test_ar.cc:204

madness::MatrixInnerTask
Definition vmra1.h:463

madness::MatrixInnerTask::get_id
virtual void get_id(std::pair< void *, unsigned short > &id) const
Get the task id.
Definition vmra1.h:485

madness::MatrixInnerTask::g
const std::vector< Function< R, NDIM > > & g
Definition vmra1.h:466

madness::MatrixInnerTask::MatrixInnerTask
MatrixInnerTask(const Tensor< TENSOR_RESULT_TYPE(T, R)> &result, const Function< T, NDIM > &f, const std::vector< Function< R, NDIM > > &g, long jtop)
Definition vmra1.h:469

madness::MatrixInnerTask::f
const Function< T, NDIM > & f
Definition vmra1.h:465

madness::MatrixInnerTask::result
Tensor< TENSOR_RESULT_TYPE(T, R)> result
Definition vmra1.h:464

madness::MatrixInnerTask::run
void run(World &world)
Runs a single-threaded task ... derived classes must implement this.
Definition vmra1.h:475

madness::MatrixInnerTask::jtop
long jtop
Definition vmra1.h:467

ncf
Definition dirac-hatom.cc:108

alpha
static const double alpha
Definition testcosine.cc:10

NDIM
constexpr std::size_t NDIM
Definition testgconv.cc:54

TENSOR_RESULT_TYPE
#define TENSOR_RESULT_TYPE(L, R)
This macro simplifies access to TensorResultType.
Definition type_data.h:205

PROFILE_BLOCK
#define PROFILE_BLOCK(name)
Definition worldprofile.h:208