madness/api-doc/tensoriter_8h_source.html

/*

  This file is part of MADNESS.


  Copyright (C) 2007,2010 Oak Ridge National Laboratory


  This program is free software; you can redistribute it and/or modify

  it under the terms of the GNU General Public License as published by

  the Free Software Foundation; either version 2 of the License, or

  (at your option) any later version.


  This program is distributed in the hope that it will be useful,

  but WITHOUT ANY WARRANTY; without even the implied warranty of

  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

  GNU General Public License for more details.


  You should have received a copy of the GNU General Public License

  along with this program; if not, write to the Free Software

  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA


  For more information please contact:


  Robert J. Harrison

  Oak Ridge National Laboratory

  One Bethel Valley Road

  P.O. Box 2008, MS-6367


  email: harrisonrj@ornl.gov

  tel:   865-241-3937

  fax:   865-572-0680


  $Id$

*/


#ifndef MADNESS_TENSOR_TENSORITER_H__INCLUDED

#define MADNESS_TENSOR_TENSORITER_H__INCLUDED


/// \file tensoriter.h

/// \brief Declares TensorIterator


#include <madness/tensor/tensor.h>

#include <madness/tensor/tensorexcept.h>


#include <iostream>

#include <algorithm>

#include <complex>


#include <cmath>


namespace madness {


    template <class T> class Tensor;

    template <class T> class SliceTensor;


    static const long default_jdim = 5551212; // Never a valid dimension num.


    /// Optimized iterator for tensors supporting unary, binary and ternary operations.

    /// \ingroup tensor


    template <class T, class Q = T, class R = T> class TensorIterator {

        T* _p0_save;

        Q* _p1_save;

        R* _p2_save;

    public:

        T* _p0;

        Q* _p1;

        R* _p2;

        long ndim;

        long dimj;

        long _s0;

        long _s1;

        long _s2;

        long dim[TENSOR_MAXDIM];

        long ind[TENSOR_MAXDIM];

        long stride0[TENSOR_MAXDIM];

        long stride1[TENSOR_MAXDIM];

        long stride2[TENSOR_MAXDIM];


        TensorIterator(const Tensor<T>* t0, const Tensor<Q>* t1=0, const Tensor<R>* t2=0,

                       long iterlevel=0,

                       bool optimize=true, bool fusedim=true,

                       long jdim=default_jdim);


        TensorIterator<T,Q,R>& operator++();


        inline bool operator == (const TensorIterator<T,Q,R>& a) const {

            return _p0==a._p0;

        }


        inline bool operator != (const TensorIterator<T,Q,R>& a) const {

            return _p0!=a._p0;

        }


        inline TensorIterator<T,Q,R>* operator->() {

            return this;

        };


        inline T& operator*() const {

            return *_p0;

        };


        void reset();


        void reuse(const Tensor<T>* t0, const Tensor<Q>* t1=0, const Tensor<R>* t2=0);

    };


    /// Constructor for general iterator to compose operations over up to three tensors


    /// \ingroup tensor

    /// Macros have been defined in \c tensor_macros.h to take the pain out of

    /// using iterators.  The options have the following effects

    /// - \c optimize reorders dimensions for optimal strides (only

    /// applies if iterlevel=1).  If jdim==default_jdim, all dimensions

    /// are reordered for optimal stride.  If jdim is not the default

    /// value, then dimension jdim is excluded from the set of

    /// dimensions being optimized.

    ///

    /// - \c fusedim concatenates contiguous dimensions into the inner

    /// loop (only applies if iterlevel=1 and jdim=default_jdim).

    ///

    /// - \c iterlevel can have two values 0=elementwise, 1=vectorwise.  Elementwise implies

    /// that the iterator returns successive elements, and explicitly

    /// in the expected order for the tensor (i.e., with the last index

    /// varying fastest).  Vectorwise implies that the user is responsible

    /// for iterating over dimension jdim.

    ///

    /// - jdim --- if iterlevel=1, then jdim determines which dimension is

    /// left for iteration with an explicit for loop.  Negative values

    /// implies jdim+=ndim following the convention of Slice (and

    /// Python).  If (optimize) the default is the fastest varying

    /// dimension.  If (!optimize) the default is the last dimension

    /// (jdim=-1). If (fusedim) contiguous dimensions are fused into

    /// this inner loop.  Specifying a non-default value for jdim

    /// disables fusedim and restricts optimization to reordering only

    /// the exterior loops (so that the loop the user is iterating over

    /// corresponds exactly to those in dimension jdim).

    ///

    /// \par During iteration:

    ///

    /// - \c ind[] will contain the current iteration indices .. BUT

    /// if \c optimize=true , they will not necessarily be in the

    /// order of those of the tensor.  if fusedim is true, then

    /// there may be fewer dimensions than the input tensor.

    ///

    /// - \c _p0, \c _p1, \c _p2 will point to the current elements of \c t0,t1,t2

    /// noting that if \c iterlevel>0, the user must provide additional

    /// \c for loops to iterate over the additional dimensions

    ///

    /// - \c stride0[], \c stride1[], \c stride2[] will contain the strides for each

    /// (possibly reordered) dimension.  If \c iterlevel=1, \c _s0,_s1,s2

    /// contain the stride info for the dimension that the user is

    /// responsible for iterating over.

    ///

    /// - \c dimj -> the size of the j'th dimension

    template <class T, class Q, class R>


    TensorIterator<T,Q,R>::TensorIterator(const Tensor<T>* t0,

                                          const Tensor<Q>* t1,

                                          const Tensor<R>* t2,

                                          long iterlevel,

                                          bool optimize,

                                          bool fusedim,

                                          long jdim) {


        if (!t0) {

            // Used to indicate end of iteration.

            _p0 = 0;

            return;

        }


        //std::printf("t0=%p t1=%p t2=%p optimize=%d fusedim=%d iterlevel=%ld jdim=%ld\n",

        //t0,t1,t2,optimize,fusedim,iterlevel,jdim);


        TENSOR_ASSERT(iterlevel==0 || iterlevel==1,"invalid iteration level",iterlevel,t0);


        // First copy basic info over

        ndim = t0->ndim();

        _p0_save = _p0 = const_cast<T*>(t0->ptr()); // CONSTNESS VIOLATION

        for (int i=0; i<ndim; ++i) {

            dim[i] = t0->dim(i);

            stride0[i] = t0->stride(i);

        }

        if (t1) {

            TENSOR_ASSERT(t0->conforms(*t1),"first and second tensors do not conform",

                          0, t0);

            _p1_save = _p1 = const_cast<Q*>(t1->ptr()); // CONSTNESS VIOLATION

            for (int i=0; i<ndim; ++i) stride1[i] = t1->stride(i);

        }

        else {

            _p1_save = _p1 = 0;

        }

        if (t2) {

            TENSOR_ASSERT(t0->conforms(*t2),"first and third tensors do not conform",

                          0, t0);

            _p2_save = _p2 = const_cast<R*>(t2->ptr()); // CONSTNESS VIOLATION

            for (int i=0; i<ndim; ++i) stride2[i] = t2->stride(i);

        }

        else {

            _p2_save = _p2 = 0;

        }


        if (iterlevel == 0) {

            // Iteration will include all dimensions

            fusedim = false;

            jdim = ndim;

            dimj = 0;

            _s0 = 0;

            _s1 = 0;

            _s2 = 0;

        }

        else if (iterlevel == 1) {

            // Apply -ve indexing convention for dimensions

            if (jdim < 0) jdim += ndim;


            // If permissible optimize the order of dimensions excluding

            // any non-default value of jdim.

            if (optimize) {

                for (int i=0; i<ndim; ++i) {

                    if (i != jdim) {

                        for (int j=i; j<ndim; ++j) {

                            if (j != jdim) {

                                if (std::abs(stride0[i]) < std::abs(stride0[j])) {

                                    std::swap(stride0[i],stride0[j]);

                                    if (t1) std::swap(stride1[i],stride1[j]);

                                    if (t2) std::swap(stride2[i],stride2[j]);

                                    std::swap(dim[i],dim[j]);

                                }

                            }

                        }

                    }

                    //std::cout << "stride0[" << i << "]=" << stride0[i] << std::endl;

                }

            }


            // Iterations will exclude dimension jdim, default is last one

            if (jdim == default_jdim) {

                jdim = ndim-1;

            }

            else {

                fusedim = false;

            }

            TENSOR_ASSERT(jdim>=0 && jdim < ndim, "invalid index for external iteration",

                          jdim, t0);

            ndim--;


            // Stride and dimension info for the excluded dimension

            _s0 = stride0[jdim];

            if (t1) {

                _s1 = stride1[jdim];

            }

            else {

                _s1 = 0;

            }

            if (t2) {

                _s2 = stride2[jdim];

            }

            else {

                _s2 = 0;

            }

            dimj = dim[jdim];


            // Collapse stride and dimension info for remaining dimensions

            for (int i=jdim+1; i<=ndim; ++i) { // GCC COMPILER WARNING ... but need <= ... why?

                dim[i-1] = dim[i];

                stride0[i-1] = stride0[i];

            }

            if (t1) {

                for (int i=jdim+1; i<=ndim; ++i) stride1[i-1] = stride1[i]; //  GCC COMPILER WARNING ... but need <= ... why?

            }

            if (t2) {

                for (int i=jdim+1; i<=ndim; ++i) stride2[i-1] = stride2[i]; //  GCC COMPILER WARNING ... but need <= ... why?

            }


            if (fusedim) {      // Only if jdim=default_jdim && iterlevel=1

                if (t2) {

                    for (int i=ndim-1; i>=0; --i) {

                        if (_s0*dimj == stride0[i] &&

                                _s1*dimj == stride1[i] &&

                                _s2*dimj == stride2[i]) {

                            dimj *= dim[i];

                            ndim--;

                        }

                        else {

                            break;

                        }

                    }

                }

                else if (t1) {

                    for (int i=ndim-1; i>=0; --i) {

                        if (_s0*dimj == stride0[i] &&

                                _s1*dimj == stride1[i]) {

                            dimj *= dim[i];

                            ndim--;

                        }

                        else {

                            break;

                        }

                    }

                }

                else {

                    for (int i=ndim-1; i>=0; --i) {

                        if (_s0*dimj == stride0[i]) {

                            dimj *= dim[i];

                            ndim--;

                        }

                        else {

                            break;

                        }

                    }

                }

            }

        }


        // Initialize indices for the counter Use TENSOR_MAXDIM so reference to

        // optimized-away dimensions is vaguely meaningful.

        for (int i=0; i<TENSOR_MAXDIM; ++i) ind[i] = 0;


        //   std::printf("ndim=%ld dimj=%ld _s0=%ld _s1=%ld _s2=%ld _p0=%p _p1=%p _p2=%p\n",

        //        ndim,dimj,_s0,_s1,_s2,_p0,_p1,_p2);

        //   for (int i=0; i<ndim; ++i) {

        //     std::printf("   %d dim=%ld stride0=%ld stride1=%ld stride2=%ld\n",

        //      i,dim[i],stride0[i],stride1[i],stride2[i]);

        //   }

    }


    template <class T, class Q, class R>


    TensorIterator<T,Q,R>& TensorIterator<T,Q,R>::operator++() {

        long d = ndim-1;

        if (d<0 || _p0==0) {

            _p0 = 0;

            return *this;

        }

        while (ind[d] >= (dim[d] - 1)) {

            _p0 -= ind[d] * stride0[d];

            if (_p1)    _p1 -= ind[d] * stride1[d];

            if (_p2)    _p2 -= ind[d] * stride2[d];

            ind[d] = 0;

            d--;

            if (d < 0) {

                _p0 = 0;

                return *this;

            }

        }

        _p0 += stride0[d];

        if (_p1) _p1 += stride1[d];

        if (_p2) _p2 += stride2[d];

        ++(ind[d]);

        return *this;

    }


    /// Reset the iterator back to the start ...

    template <class T, class Q, class R>


    void TensorIterator<T,Q,R>::reset() {

        _p0 = _p0_save;

        _p1 = _p1_save;

        _p2 = _p2_save;

        for (int i=0; i<TENSOR_MAXDIM; ++i) ind[i] = 0;

    }


    /// Reuse this iterator to iterate over other Tensors


    /// The point of this method is to optimize away the construction of a

    /// TensorIterator when applying the same operation repeatedly to

    /// multiple tensors with identical shapes & strides.  We trust the

    /// caller to ensure all shapes & strides match between the new

    /// tensors and the ones used in the original constructor.

    template <class T, class Q, class R>


    void TensorIterator<T,Q,R>::reuse(const Tensor<T>* t0,

                                      const Tensor<Q> *t1,

                                      const Tensor<R> *t2) {

        _p0 = _p0_save = t0->ptr();

        if (t1) _p1 = _p1_save = t1->ptr();

        if (t2) _p2 = _p2_save = t2->ptr();

        for (int i=0; i<TENSOR_MAXDIM; ++i) ind[i] = 0;

    }


}

#endif // MADNESS_TENSOR_TENSORITER_H__INCLUDED

madness::BaseTensor::dim
long dim(int i) const
Returns the size of dimension i.
Definition basetensor.h:147

madness::BaseTensor::stride
long stride(int i) const
Returns the stride associated with dimension i.
Definition basetensor.h:150

madness::BaseTensor::ndim
long ndim() const
Returns the number of dimensions in the tensor.
Definition basetensor.h:144

madness::TensorIterator
Definition tensoriter.h:61

madness::TensorIterator::_p2_save
R * _p2_save
Definition tensoriter.h:64

madness::TensorIterator::stride0
long stride0[TENSOR_MAXDIM]
Definition tensoriter.h:76

madness::TensorIterator::operator==
bool operator==(const TensorIterator< T, Q, R > &a) const
Definition tensoriter.h:87

madness::TensorIterator::dim
long dim[TENSOR_MAXDIM]
Definition tensoriter.h:74

madness::TensorIterator::stride1
long stride1[TENSOR_MAXDIM]
Definition tensoriter.h:77

madness::TensorIterator::_p0_save
T * _p0_save
Definition tensoriter.h:62

madness::TensorIterator::reuse
void reuse(const Tensor< T > *t0, const Tensor< Q > *t1=0, const Tensor< R > *t2=0)
Reuse this iterator to iterate over other Tensors.
Definition tensoriter.h:370

madness::TensorIterator::dimj
long dimj
Definition tensoriter.h:70

madness::TensorIterator::_s1
long _s1
Definition tensoriter.h:72

madness::TensorIterator::operator!=
bool operator!=(const TensorIterator< T, Q, R > &a) const
Definition tensoriter.h:91

madness::TensorIterator::_s0
long _s0
Definition tensoriter.h:71

madness::TensorIterator::_p1
Q * _p1
Definition tensoriter.h:67

madness::TensorIterator::ndim
long ndim
Definition tensoriter.h:69

madness::TensorIterator::operator++
TensorIterator< T, Q, R > & operator++()
Definition tensoriter.h:328

madness::TensorIterator::reset
void reset()
Reset the iterator back to the start ...
Definition tensoriter.h:354

madness::TensorIterator::ind
long ind[TENSOR_MAXDIM]
Definition tensoriter.h:75

madness::TensorIterator::_p1_save
Q * _p1_save
Definition tensoriter.h:63

madness::TensorIterator::operator->
TensorIterator< T, Q, R > * operator->()
Definition tensoriter.h:95

madness::TensorIterator::operator*
T & operator*() const
Definition tensoriter.h:99

madness::TensorIterator::_p2
R * _p2
Definition tensoriter.h:68

madness::TensorIterator::_p0
T * _p0
Definition tensoriter.h:66

madness::TensorIterator::stride2
long stride2[TENSOR_MAXDIM]
Definition tensoriter.h:78

madness::TensorIterator::_s2
long _s2
Definition tensoriter.h:73

madness::Tensor
A tensor is a multidimensional array.
Definition tensor.h:317

madness::Tensor::ptr
T * ptr()
Returns a pointer to the internal data.
Definition tensor.h:1825

madness::Tensor::conforms
bool conforms(const Tensor< Q > &t) const
Test if *this and t conform.
Definition tensor.h:1657

R
static const double R
Definition csqrt.cc:46

T
auto T(World &world, response_space &f) -> response_space
Definition global_functions.cc:28

madness::TensorIterator::TensorIterator
TensorIterator(const Tensor< T > *t0, const Tensor< Q > *t1=0, const Tensor< R > *t2=0, long iterlevel=0, bool optimize=true, bool fusedim=true, long jdim=default_jdim)
Constructor for general iterator to compose operations over up to three tensors.
Definition tensoriter.h:157

madness
Namespace for all elements and tools of MADNESS.
Definition DFParameters.h:10

madness::default_jdim
static const long default_jdim
Definition tensoriter.h:57

std::abs
static long abs(long a)
Definition tensor.h:218

d
static const double d
Definition nonlinschro.cc:121

a
static const double a
Definition nonlinschro.cc:118

Q
double Q(double a)
Definition relops.cc:20

tensor.h
Defines and implements most of Tensor.

TENSOR_MAXDIM
#define TENSOR_MAXDIM
Definition tensor_macros.h:194

tensorexcept.h
Declares and implements TensorException.

TENSOR_ASSERT
#define TENSOR_ASSERT(condition, msg, value, t)
Definition tensorexcept.h:130