madness/vmra1_8h_source.html

 /*

   This file is part of MADNESS.


   Copyright (C) 2007,2010 Oak Ridge National Laboratory


   This program is free software; you can redistribute it and/or modify

   it under the terms of the GNU General Public License as published by

   the Free Software Foundation; either version 2 of the License, or

   (at your option) any later version.


   This program is distributed in the hope that it will be useful,

   but WITHOUT ANY WARRANTY; without even the implied warranty of

   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

   GNU General Public License for more details.


   You should have received a copy of the GNU General Public License

   along with this program; if not, write to the Free Software

   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA


   For more information please contact:


   Robert J. Harrison

   Oak Ridge National Laboratory

   One Bethel Valley Road

   P.O. Box 2008, MS-6367


   email: harrisonrj@ornl.gov

   tel:   865-241-3937

   fax:   865-572-0680


   $Id$

 */


 #ifndef MADNESS_MRA_VMRA_H__INCLUDED

 #define MADNESS_MRA_VMRA_H__INCLUDED


 #include <madness/mra/mra.h>

 #include <madness/mra/derivative.h>

 #include <cstdio>


 namespace madness {


     /// Compress every function in \c v that is not already compressed.
     ///
     /// Functions are visited in consecutive blocks of \c blk entries. Each
     /// per-function compress is started without a fence. When \c fence is true
     /// and \c blk != 1 a global fence follows each block once any work has been
     /// started, and a final fence follows the loop if anything was compressed.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param v      Functions to compress.
     /// \param blk    Number of functions per block; must be non-zero or the
     ///               block loop cannot advance.
     /// \param fence  If false, this routine issues no fence at all.
     template <typename T, std::size_t NDIM>
     void compress(World& world,
                   const std::vector< Function<T,NDIM> >& v,
                   unsigned int blk=1,
                   bool fence=true){

         PROFILE_BLOCK(Vcompress);
         bool must_fence = false;
         unsigned int vvsize = v.size();
         for (unsigned int i=0; i<vvsize; i+= blk) {
           // Block is [i, i+blk). The previous bound (i+1)*blk treated i as a
           // block index although i advances by blk, so blocks overlapped.
           const unsigned int jend = std::min(vvsize, i+blk);
           for (unsigned int j=i; j<jend; ++j) {
             if (!v[j].is_compressed()) {
               v[j].compress(false);
               must_fence = true;
             }
           }
           if ( blk!=1 && must_fence && fence) world.gop.fence();
         }

         if (fence && must_fence) world.gop.fence();
     }


     /// Reconstruct every function in \c v that is currently compressed.
     ///
     /// Functions are visited in consecutive blocks of \c blk entries. Each
     /// per-function reconstruct is started without a fence. When \c fence is
     /// true and \c blk != 1 a global fence follows each block once any work has
     /// been started, and a final fence follows the loop if anything was
     /// reconstructed.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param v      Functions to reconstruct.
     /// \param blk    Number of functions per block; must be non-zero.
     /// \param fence  If false, this routine issues no fence at all.
     template <typename T, std::size_t NDIM>
     void reconstruct(World& world,
                      const std::vector< Function<T,NDIM> >& v,
                      unsigned int blk=1,
                      bool fence=true){ // reconstr
         PROFILE_BLOCK(Vreconstruct);
         bool must_fence = false;
         unsigned int vvsize = v.size();
         for (unsigned int i=0; i<vvsize; i+= blk) {
           // Block is [i, i+blk); (i+1)*blk made blocks overlap for blk>1.
           const unsigned int jend = std::min(vvsize, i+blk);
           for (unsigned int j=i; j<jend; ++j) {
             if (v[j].is_compressed()) {
               v[j].reconstruct(false);
               must_fence = true;
             }
           }
           if ( blk!=1 && must_fence && fence) world.gop.fence();
         }

         if (fence && must_fence) world.gop.fence();
     } // reconstr


     /// Generate the non-standard form of every function in \c v.
     ///
     /// The vector is first passed to reconstruct(world, v, blk); then
     /// \c nonstandard(false,false) is started on each function, block by block.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param v      Functions to convert.
     /// \param blk    Number of functions per block; must be non-zero.
     /// \param fence  If true, fence after each block (when blk != 1) and once
     ///               more after the loop.
     template <typename T, std::size_t NDIM>
       void nonstandard(World& world,
                        std::vector< Function<T,NDIM> >& v,
                        unsigned int blk=1,
                        bool fence=true) { // nonstand
         PROFILE_BLOCK(Vnonstandard);
         unsigned int vvsize = v.size();
         reconstruct(world, v, blk);
         for (unsigned int i=0; i<vvsize; i+= blk) {
           // Block is [i, i+blk). The old bound (i+1)*blk overlapped later
           // blocks, starting nonstandard() more than once on one function.
           const unsigned int jend = std::min(vvsize, i+blk);
           for (unsigned int j=i; j<jend; ++j) {
             v[j].nonstandard(false,false);
           }
           if ( blk!=1 && fence) world.gop.fence();
         }
         if (fence) world.gop.fence();
     } //nonstand


     /// Generate the standard form of every function in \c v.
     ///
     /// \c standard(false) is started on each function, block by block.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param v      Functions to convert.
     /// \param blk    Number of functions per block; must be non-zero.
     /// \param fence  If true, fence after each block (when blk != 1) and once
     ///               more after the loop.
     template <typename T, std::size_t NDIM>
       void standard(World& world,
                     std::vector< Function<T,NDIM> >& v,
                     unsigned int blk=1,
                     bool fence=true){ // standard
         PROFILE_BLOCK(Vstandard);
         unsigned int vvsize = v.size();
         for (unsigned int i=0; i<vvsize; i+= blk) {
           // Block is [i, i+blk); (i+1)*blk made blocks overlap for blk>1.
           const unsigned int jend = std::min(vvsize, i+blk);
           for (unsigned int j=i; j<jend; ++j) {
             v[j].standard(false);
           }
           if ( blk!=1 && fence) world.gop.fence();
         }
         if (fence) world.gop.fence();
     } // standard


     /// Truncate every function in \c v.
     ///
     /// The vector is first passed to compress(world, v, blk); then
     /// \c truncate(tol,false) is started on each function, block by block.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param v      Functions to truncate.
     /// \param tol    Tolerance forwarded unchanged to Function::truncate.
     /// \param blk    Number of functions per block; must be non-zero.
     /// \param fence  If true, fence after each block (when blk != 1) and once
     ///               more after the loop.
     template <typename T, std::size_t NDIM>
     void truncate(World& world,
                   std::vector< Function<T,NDIM> >& v,
                   double tol=0.0,
                   unsigned int blk=1,
                   bool fence=true){ // truncate
         PROFILE_BLOCK(Vtruncate);

         compress(world, v, blk);

         unsigned int vvsize = v.size();
         for (unsigned int i=0; i<vvsize; i+= blk) {
           // Block is [i, i+blk). The old bound (i+1)*blk overlapped later
           // blocks, so some functions were truncated more than once.
           const unsigned int jend = std::min(vvsize, i+blk);
           for (unsigned int j=i; j<jend; ++j) {
             v[j].truncate(tol, false);
           }
           if ( blk!=1 && fence) world.gop.fence();
         }
         if (fence) world.gop.fence();
     } //truncate


     /// Apply the derivative operator \c D to every function in \c v.
     ///
     /// The input is first passed to reconstruct(world, v, blk); then
     /// \c df[j] = D(v[j],false) is evaluated block by block.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param D      Derivative operator invoked on each function.
     /// \param v      Input functions.
     /// \param blk    Number of functions per block; must be non-zero.
     /// \param fence  If true, fence after each block (when blk != 1) and once
     ///               more after the loop.
     /// \return Vector of the same length as \c v holding the results.
     template <typename T, std::size_t NDIM>
       std::vector< Function<T,NDIM> >
       apply(World& world,
              const Derivative<T,NDIM>& D,
              const std::vector< Function<T,NDIM> >& v,
              const unsigned int blk=1,
              const bool fence=true)
       {
         reconstruct(world, v, blk);
         std::vector< Function<T,NDIM> > df(v.size());

         unsigned int vvsize = v.size();

         for (unsigned int i=0; i<vvsize; i+= blk) {
           // Block is [i, i+blk). The old bound (i+1)*blk overlapped later
           // blocks, so derivatives were evaluated more than once.
           const unsigned int jend = std::min(vvsize, i+blk);
           for (unsigned int j=i; j<jend; ++j) {
             df[j] = D(v[j],false);
           }
           if (blk!= 1 && fence) world.gop.fence();
         }
         if (fence) world.gop.fence();

         return df;
       }


     /// Build a vector of \c n functions, each constructed from a fresh
     /// FunctionFactory bound to \c world.
     ///
     /// \param world  World handed to every FunctionFactory.
     /// \param n      Number of functions to create.
     /// \return The newly created functions.
     template <typename T, std::size_t NDIM>
       std::vector< Function<T,NDIM> >
       zero_functions(World& world, int n) {
       PROFILE_BLOCK(Vzero_functions);
       typedef Function<T,NDIM> functionT;
       typedef typename std::vector<functionT>::iterator iterT;

       std::vector<functionT> zeros(n);
       for (iterT it = zeros.begin(); it != zeros.end(); ++it) {
         *it = functionT(FunctionFactory<T,NDIM>(world));
       }
       return zeros;
     }


     /// Transform a vector of functions by the coefficient matrix \c c.
     ///
     /// For every output index \c ii and input index \c jj with a non-zero
     /// coefficient, \c vc[ii].gaxpy(1.0, v[jj], c(jj,ii), false) is issued, so
     /// each output accumulates the inputs weighted by column \c ii of \c c.
     /// Outputs are walked in blocks of \c blki and inputs in blocks of \c blkj.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param v      Input functions; \c v.size() must equal \c c.dim(0).
     /// \param c      Coefficient matrix; \c c.dim(1) is the number of outputs.
     /// \param blki   Block size over outputs; must be non-zero.
     /// \param blkj   Block size over inputs; must be non-zero.
     /// \param fence  If true, fence after each input block (blkj != 1), after
     ///               each output block (blki != 1) and once at the end.
     /// \return The \c c.dim(1) transformed functions.
     template <typename T, typename R, std::size_t NDIM>
       std::vector< Function<TENSOR_RESULT_TYPE(T,R),NDIM> >
       transform(World& world,
                 const std::vector< Function<T,NDIM> >& v,
                 const Tensor<R>& c,
                 unsigned int blki=1,
                 unsigned int blkj=1,
                 const bool fence=true){

       PROFILE_BLOCK(Vtransformsp);

       typedef TENSOR_RESULT_TYPE(T,R) resultT;

       // Qualified std::min, matching every other use in this file.
       unsigned int blk = std::min(blki, blkj);
       unsigned int n = v.size();  // n is the old dimension
       unsigned int m = c.dim(1);  // m is the new dimension
       MADNESS_ASSERT(n==c.dim(0));

       std::vector< Function<resultT,NDIM> > vc = zero_functions<resultT,NDIM>(world, m);
       compress(world, v, blk);
       compress(world, vc, blk); // what to do ?

       for (unsigned int i=0; i<m; i+= blki) {
         // Output block is [i, i+blki) and input block is [j, j+blkj). The old
         // bounds (i+1)*blki and (j+1)*blkj overlapped later blocks, so the same
         // contribution was accumulated into vc[ii] more than once.
         const unsigned int iend = std::min(m, i+blki);
         for (unsigned int ii=i; ii<iend; ii++) {
           for (unsigned int j=0; j<n; j+= blkj) {
             const unsigned int jend = std::min(n, j+blkj);
             for (unsigned int jj=j; jj<jend; jj++)
               if (c(jj,ii) != R(0.0)) vc[ii].gaxpy(1.0,v[jj],c(jj,ii),false);
             if (fence && (blkj!=1)) world.gop.fence();
           }
         }
         if (fence && (blki!=1)) world.gop.fence();  // a bit conservative
       }

       if (fence) world.gop.fence();
       return vc;
     }


     /// Transform a vector of functions by the matrix \c c with screening
     /// tolerance \c tol, delegating the work to Function::vtransform.
     ///
     /// Result functions are created block by block, inputs and results are
     /// compressed, a global fence is issued, and then
     /// \c vresult[0].vtransform(v, c, vresult, tol, fence) performs the
     /// transformation.
     ///
     /// \param world  World used to create the results and to fence.
     /// \param v      Input functions; \c v.size() must equal \c c.dim(0).
     /// \param c      Coefficient matrix; \c c.dim(1) is the number of outputs.
     /// \param tol    Tolerance forwarded unchanged to vtransform.
     /// \param blki   Block size over outputs; must be non-zero.
     /// \param fence  Forwarded to vtransform; also enables the per-block fence
     ///               while creating results. Defaults to true because a
     ///               parameter following the defaulted \c blki must itself
     ///               have a default argument.
     /// \return The \c c.dim(1) transformed functions.
     template <typename L, typename R, std::size_t NDIM>
       std::vector< Function<TENSOR_RESULT_TYPE(L,R),NDIM> >
       transform(World& world,
                 const std::vector< Function<L,NDIM> >& v,
                 const Tensor<R>& c,
                 const double tol,
                 const unsigned int blki=1,
                 const bool fence=true)
       {
         PROFILE_BLOCK(Vtransform);
         MADNESS_ASSERT(v.size() == (unsigned int)(c.dim(0)));

         std::vector< Function<TENSOR_RESULT_TYPE(L,R),NDIM> > vresult(c.dim(1));
         unsigned int m=c.dim(1);

         for (unsigned int i=0; i<m; i+= blki) {
           // Block is [i, i+blki). The old bound (i+1)*blki overlapped later
           // blocks, so result functions were created and replaced repeatedly.
           const unsigned int iend = std::min(m, i+blki);
           for (unsigned int ii=i; ii<iend; ii++) {
             vresult[ii] = Function<TENSOR_RESULT_TYPE(L,R),NDIM>(FunctionFactory<TENSOR_RESULT_TYPE(L,R),NDIM>(world));
           }
           if (fence && (blki!=1)) world.gop.fence();  // a bit conservative
         }

         compress(world, v, blki, false);
         compress(world, vresult, blki, false);
         world.gop.fence();

         // With no output columns there is no vresult[0] to dispatch through.
         if (m == 0) return vresult;

         vresult[0].vtransform(v, c, vresult, tol, fence);
         return vresult;
       }


     /// Scale each function in place by its own factor: \c v[j].scale(factors[j]).
     ///
     /// \param world    World whose \c gop.fence() is used for synchronisation.
     /// \param v        Functions to scale in place.
     /// \param factors  One factor per function; indexed with the same index
     ///                 as \c v, so it needs at least \c v.size() entries.
     /// \param blk      Number of functions per block; must be non-zero.
     /// \param fence    If true, fence after each block (when blk != 1) and once
     ///                 more after the loop.
     template <typename T, typename Q, std::size_t NDIM>
       void scale(World& world,
                  std::vector< Function<T,NDIM> >& v,
                  const std::vector<Q>& factors,
                  const unsigned int blk=1,
                  const bool fence=true)
       {
         PROFILE_BLOCK(Vscale);

         unsigned int vvsize = v.size();
         for (unsigned int i=0; i<vvsize; i+= blk) {
           // Block is [i, i+blk). The old bound (i+1)*blk overlapped later
           // blocks, so some functions were scaled more than once.
           const unsigned int jend = std::min(vvsize, i+blk);
           for (unsigned int j=i; j<jend; ++j) {
             v[j].scale(factors[j],false);
           }
           if (fence && blk!=1 ) world.gop.fence();
         }
         if (fence) world.gop.fence();
       }


     /// Scale every function in place by the same factor: \c v[j].scale(factor).
     ///
     /// \param world   World whose \c gop.fence() is used for synchronisation.
     /// \param v       Functions to scale in place.
     /// \param factor  Factor applied to every function.
     /// \param blk     Number of functions per block; must be non-zero.
     /// \param fence   If true, fence after each block (when blk != 1) and once
     ///                more after the loop.
     template <typename T, typename Q, std::size_t NDIM>
       void scale(World& world,
                  std::vector< Function<T,NDIM> >& v,
                   const Q factor,
                  const unsigned int blk=1,
                  const bool fence=true){

         PROFILE_BLOCK(Vscale); // shouldn't need blocking since it is local

         unsigned int vvsize = v.size();
         for (unsigned int i=0; i<vvsize; i+= blk) {
           // Block is [i, i+blk). The old bound (i+1)*blk overlapped later
           // blocks, so some functions were scaled more than once.
           const unsigned int jend = std::min(vvsize, i+blk);
           for (unsigned int j=i; j<jend; ++j) {
             v[j].scale(factor,false);
           }
           if (fence && blk!=1 ) world.gop.fence();
         }
         if (fence) world.gop.fence();
       }


     /// Compute the 2-norm of each function in \c v.
     ///
     /// Each entry is filled with \c v[j].norm2sq_local(), the entries are
     /// summed across the world with \c gop.sum, and the square root of each
     /// sum is returned.
     ///
     /// \param world  World used for the global sum and fences.
     /// \param v      Functions whose norms are wanted.
     /// \param blk    Number of functions per block; must be non-zero.
     /// \param fence  If true, fence after each block (when blk != 1) and after
     ///               the accumulation loop. A final fence is always issued.
     /// \return One norm per function, in the order of \c v.
     template <typename T, std::size_t NDIM>
       std::vector<double> norm2s(World& world,
                                  const std::vector< Function<T,NDIM> >& v,
                                  const unsigned int blk=1,
                                  const bool fence=true){

       PROFILE_BLOCK(Vnorm2);
       unsigned int vvsize = v.size();
       std::vector<double> norms(vvsize);

       for (unsigned int i=0; i<vvsize; i+= blk) {
         // Block is [i, i+blk); (i+1)*blk made blocks overlap for blk>1.
         const unsigned int jend = std::min(vvsize, i+blk);
         for (unsigned int j=i; j<jend; ++j) {
           norms[j] = v[j].norm2sq_local();
         }
         if (fence && (blk!=1)) world.gop.fence();
       }
       if (fence ) world.gop.fence();

       // &norms[0] is not valid for an empty vector, so skip the reduction then.
       if (!norms.empty()) world.gop.sum(&norms[0], norms.size());

       for (unsigned int i=0; i<vvsize; i+= blk) {
         // With the old overlapping bound, sqrt was applied several times to
         // the same entry whenever blk>1, corrupting the returned norms.
         const unsigned int jend = std::min(vvsize, i+blk);
         for (unsigned int j=i; j<jend; ++j)
           norms[j] = sqrt(norms[j]);
         if (fence && (blk!=1)) world.gop.fence();
       }

       world.gop.fence();
       return norms;
     }


     // should be local; norms[0] contains the result


     /// Compute the 2-norm of a whole vector of functions.
     ///
     /// Each function contributes \c norm2sq_local(); the per-function values
     /// are summed across the world with \c gop.sum, added together, and the
     /// square root of the total is returned after a global fence.
     ///
     /// \param world  World used for the global sum and fence.
     /// \param v      Functions forming the vector.
     /// \return Square root of the accumulated squared norms; 0 for empty \c v.
     template <typename T, std::size_t NDIM>
       double norm2(World& world,
                    const std::vector< Function<T,NDIM> >& v)
       {

         PROFILE_BLOCK(Vnorm2);

         std::vector<double> norms(v.size());

         // An empty vector has no norms[0] to reduce into or read back; keep
         // the trailing fence and report a zero norm.
         if (norms.empty()) {
           world.gop.fence();
           return 0.0;
         }

         for (unsigned int i=0; i<v.size(); ++i)
           norms[i] = v[i].norm2sq_local();

         world.gop.sum(&norms[0], norms.size());

         // Fold every entry into norms[0], which then holds the total.
         for (unsigned int i=1; i<v.size(); ++i)
           norms[0] += norms[i];

         world.gop.fence();
         return sqrt(norms[0]);
       }


     /// Conjugate of a real \c double: the value is returned unchanged.
     inline double conj(double x) { return x; }


     /// Conjugate of a real \c float: the value is returned unchanged, widened
     /// to \c double by the return type.
     inline double conj(float x) { return x; }


     template <typename T, typename R, std::size_t NDIM>

     struct MatrixInnerTask : public TaskInterface {

         Tensor<TENSOR_RESULT_TYPE(T,R)> result; // Must be a copy

         const Function<T,NDIM>& f;

         const std::vector< Function<R,NDIM> >& g;

         long jtop;


         MatrixInnerTask(const Tensor<TENSOR_RESULT_TYPE(T,R)>& result,

                 const Function<T,NDIM>& f,

                 const std::vector< Function<R,NDIM> >& g,

                 long jtop)

         : result(result), f(f), g(g), jtop(jtop) {}


         void run(World& world) {

             for (long j=0; j<jtop; ++j) {

                 result(j) = f.inner_local(g[j]);

             }

         }


     private:


         virtual void get_id(std::pair<void*,unsigned short>& id) const {

             PoolTaskInterface::make_id(id, *this);

         }

     }; // struct MatrixInnerTask


     /// Compute the matrix of inner products \c r(i,j) of \c f[i] with \c g[j].
     ///
     /// Both vectors are compressed, one MatrixInnerTask per row is queued to
     /// compute the local contributions, and the matrix is then summed across
     /// the world. With \c sym only columns \c j <= i are computed and the
     /// upper triangle is filled with \c conj(r(i,j)).
     ///
     /// \param world  World providing the task queue, fences and global sum.
     /// \param f      Row functions.
     /// \param g      Column functions.
     /// \param sym    Assume a symmetric/Hermitian result; requires
     ///               \c f.size() == g.size().
     /// \return The \c f.size() by \c g.size() matrix of inner products.
     template <typename T, typename R, std::size_t NDIM>
       Tensor< TENSOR_RESULT_TYPE(T,R) > matrix_inner(World& world,
                                                      const std::vector< Function<T,NDIM> >& f,
                                                      const std::vector< Function<R,NDIM> >& g,
                                                      bool sym=false) {
       PROFILE_BLOCK(Vmatrix_inner);
       unsigned int n=f.size(), m=g.size();
       Tensor< TENSOR_RESULT_TYPE(T,R) > r(n,m);
       if (sym) MADNESS_ASSERT(n==m);

       world.gop.fence();
       compress(world, f);
       // Compare addresses through const void* so the aliasing check is also
       // well-formed when T and R differ.
       if (static_cast<const void*>(&f) != static_cast<const void*>(&g)) compress(world, g);

       // Queue rows from last to first. The counter is unsigned, so the
       // previous "i>=0" test was always true: the loop never ended and f[i]
       // was indexed out of range after wrap-around (immediately for n==0).
       for (unsigned int i=n; i-- > 0; ) {
         unsigned int jtop = m;
         if (sym) jtop = i+1;
         world.taskq.add(new MatrixInnerTask<T,R,NDIM>(r(i,_), f[i], g, jtop));
       }
       world.gop.fence();
       world.gop.sum(r.ptr(),n*m);

       if (sym) {
         // Mirror the computed lower triangle into the upper triangle.
         for (unsigned int i=0; i<n; ++i) {
           for (unsigned int j=0; j<i; ++j) {
             r(j,i) = conj(r(i,j));
           }
         }
       }
       return r;
     }


     /// Element-wise inner products: \c r(i) is the inner product of \c f[i]
     /// with \c g[i].
     ///
     /// Both vectors are compressed, the local contributions are computed with
     /// \c inner_local, and the result is summed across the world.
     ///
     /// \param world  World providing fences and the global sum.
     /// \param f      Left-hand functions.
     /// \param g      Right-hand functions; must have the same length as \c f.
     /// \return Tensor of length \c f.size() holding the inner products.
     template <typename T, typename R, std::size_t NDIM>
       Tensor< TENSOR_RESULT_TYPE(T,R) > inner(World& world,
                                               const std::vector< Function<T,NDIM> >& f,
                                               const std::vector< Function<R,NDIM> >& g) {
       PROFILE_BLOCK(Vinnervv);
       typedef TENSOR_RESULT_TYPE(T,R) resultT;

       long n=f.size(), m=g.size();
       MADNESS_ASSERT(n==m);
       Tensor<resultT> dots(n);

       compress(world, f);
       compress(world, g);

       // Local contributions only; the global sum below combines them.
       long k = 0;
       while (k < n) {
         dots(k) = f[k].inner_local(g[k]);
         ++k;
       }

       world.taskq.fence();
       world.gop.sum(dots.ptr(),n);
       world.gop.fence();
       return dots;
     }


     /// Inner products of one function with each member of a vector:
     /// \c r(i) is the inner product of \c f with \c g[i].
     ///
     /// \c f and \c g are compressed, the local contributions are computed with
     /// \c inner_local, and the result is summed across the world.
     ///
     /// \param world  World providing fences and the global sum.
     /// \param f      Left-hand function.
     /// \param g      Right-hand functions.
     /// \return Tensor of length \c g.size() holding the inner products.
     template <typename T, typename R, std::size_t NDIM>
       Tensor< TENSOR_RESULT_TYPE(T,R) > inner(World& world,
                                               const Function<T,NDIM>& f,
                                               const std::vector< Function<R,NDIM> >& g) {
       PROFILE_BLOCK(Vinner);
       typedef TENSOR_RESULT_TYPE(T,R) resultT;

       const long count = g.size();
       Tensor<resultT> dots(count);

       f.compress();
       compress(world, g);

       // Local contributions only; the global sum below combines them.
       long k = 0;
       while (k < count) {
         dots(k) = f.inner_local(g[k]);
         ++k;
       }

       world.taskq.fence();
       world.gop.sum(dots.ptr(),count);
       world.gop.fence();
       return dots;
     }


     /// Multiply the function \c a with every function in \c v.
     ///
     /// \c a and \c v are reconstructed without individual fences, a single
     /// global fence follows, and the product is delegated to \c vmulXX with a
     /// tolerance of zero.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param a      Left factor.
     /// \param v      Right factors.
     /// \param blk    Block size forwarded to reconstruct().
     /// \param fence  Forwarded to \c vmulXX.
     /// \return Whatever \c vmulXX(a, v, 0.0, fence) returns.
     template <typename T, typename R, std::size_t NDIM>
       std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >
       mul(World& world,
           const Function<T,NDIM>& a,
           const std::vector< Function<R,NDIM> >& v,
           const unsigned int blk=1,
           const bool fence=true) {

       PROFILE_BLOCK(Vmul);

       // Start both reconstructions, then wait for them together.
       a.reconstruct(false);
       reconstruct(world, v, blk, false);
       world.gop.fence();

       const double zero_tol = 0.0;
       return vmulXX(a, v, zero_tol, fence);
     }


     /// Multiply the function \c a with every function in \c v using the
     /// screening tolerance \c tol.
     ///
     /// \c a and \c v are reconstructed, \c norm_tree is built for each member
     /// of \c v and for \c a, and the product is delegated to \c vmulXX.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param a      Left factor.
     /// \param v      Right factors.
     /// \param tol    Tolerance forwarded unchanged to \c vmulXX.
     /// \param fence  Forwarded to \c vmulXX; also enables per-block fences
     ///               while building norm trees when blk != 1.
     /// \param blk    Number of functions per block; must be non-zero.
     /// \return Whatever \c vmulXX(a, v, tol, fence) returns.
     template <typename T, typename R, std::size_t NDIM>
       std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >
       mul_sparse(World& world,
                  const Function<T,NDIM>& a,
                  const std::vector< Function<R,NDIM> >& v,
                  const double tol,
                  const bool fence=true,
                  const unsigned int blk=1)
  {
       PROFILE_BLOCK(Vmulsp);
       a.reconstruct(false);
       reconstruct(world, v, blk, false);
       world.gop.fence();

       unsigned int vvsize = v.size();
       for (unsigned int i=0; i<vvsize; i+= blk) {
         // Block is [i, i+blk). The old bound (i+1)*blk overlapped later
         // blocks, starting norm_tree more than once on the same function.
         const unsigned int jend = std::min(vvsize, i+blk);
         for (unsigned int j=i; j<jend; ++j)
           v[j].norm_tree(false);
         // Per-block fence only when blocking is in use, as in every other
         // routine here; the previous test (blk == 1) was inverted.
         if ( fence && (blk != 1)) world.gop.fence();
       }
       // Called with its default arguments; presumably this fences and so
       // completes the norm trees started above - TODO confirm.
       a.norm_tree();
       return vmulXX(a, v, tol, fence);
     }


     /// Build the norm tree of every function in \c v.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param v      Functions to process.
     /// \param fence  If true, fence after each block (when blk != 1) and once
     ///               more after the loop.
     /// \param blk    Number of functions per block; must be non-zero.
     template <typename T, std::size_t NDIM>
       void norm_tree(World& world,
                      const std::vector< Function<T,NDIM> >& v,
                      bool fence=true,
                      unsigned int blk=1){
         PROFILE_BLOCK(Vnorm_tree);

       unsigned int vvsize = v.size();
       for (unsigned int i=0; i<vvsize; i+= blk) {
         // Block is [i, i+blk); (i+1)*blk made blocks overlap for blk>1.
         const unsigned int jend = std::min(vvsize, i+blk);
         for (unsigned int j=i; j<jend; ++j)
           v[j].norm_tree(false);
         if (fence && blk!=1 ) world.gop.fence();
       }
       if (fence) world.gop.fence();
     }


     /// Element-wise product of two vectors of functions:
     /// \c q[j] = mul(a[j], b[j], false).
     ///
     /// Both inputs are reconstructed first, with \c b skipped when it is the
     /// same object as \c a, followed by a global fence.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param a      Left factors; determines the length of the result.
     /// \param b      Right factors; indexed with the same index as \c a.
     /// \param fence  If true, fence after each block (when blk != 1) and once
     ///               more after the loop.
     /// \param blk    Number of functions per block; must be non-zero.
     /// \return Vector of \c a.size() products.
     template <typename T, typename R, std::size_t NDIM>
       std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >
       mul(World& world,
           const std::vector< Function<T,NDIM> >& a,
           const std::vector< Function<R,NDIM> >& b,
           bool fence=true,
           unsigned int blk=1){
       PROFILE_BLOCK(Vmulvv);
       reconstruct(world, a, blk, false);
       // Compare addresses through const void* so the aliasing check is also
       // well-formed when T and R differ.
       if (static_cast<const void*>(&a) != static_cast<const void*>(&b)) reconstruct(world, b, blk, false);
       world.gop.fence();

       std::vector< Function<TENSOR_RESULT_TYPE(T,R),NDIM> > q(a.size());

       unsigned int vvsize = a.size();
       for (unsigned int i=0; i<vvsize; i+= blk) {
         // Block is [i, i+blk). The old bound (i+1)*blk overlapped later
         // blocks, so products were started more than once.
         const unsigned int jend = std::min(vvsize, i+blk);
         for (unsigned int j=i; j<jend; ++j)
           q[j] = mul(a[j], b[j], false);
         if (fence && (blk !=1 )) world.gop.fence();
       }
       if (fence) world.gop.fence();
       return q;
     }


     /// Square every function in \c v by multiplying the vector with itself.
     ///
     /// \param world  World forwarded to mul().
     /// \param v      Functions to square.
     /// \param fence  Forwarded to mul().
     /// \return Result of the element-wise product of \c v with \c v.
     template <typename T, std::size_t NDIM>
       std::vector< Function<T,NDIM> >
       square(World& world,
              const std::vector< Function<T,NDIM> >& v,
              bool fence=true) {
       // Delegates to the vector-vector mul with both operands equal to v.
       return mul<T,T,NDIM>(world, v, v, fence);
     }


     /// Set the threshold of every function in \c v to \c thresh.
     ///
     /// \param world   World whose \c gop.fence() is used for synchronisation.
     /// \param v       Functions to update.
     /// \param thresh  Threshold passed to each Function::set_thresh call.
     /// \param fence   If true, issue one global fence after the loop.
     template <typename T, std::size_t NDIM>
       void set_thresh(World& world,
                       std::vector< Function<T,NDIM> >& v,
                       double thresh,
                       bool fence=true) {
       typedef typename std::vector< Function<T,NDIM> >::iterator iterT;

       // Each call is made without a fence; the optional fence comes after.
       for (iterT it = v.begin(); it != v.end(); ++it) {
         it->set_thresh(thresh,false);
       }
       if (fence) {
         world.gop.fence();
       }
     }


     /// Return the complex conjugate of every function in \c v.
     ///
     /// The input is copied with copy(world, v) and each copy is conjugated in
     /// place, because no out-of-place conjugate is available.
     ///
     /// \param world  World used for the copy and the optional fence.
     /// \param v      Functions to conjugate; left untouched.
     /// \param fence  If true, issue one global fence after the loop.
     /// \return The conjugated copies.
     template <typename T, std::size_t NDIM>
       std::vector< Function<T,NDIM> >
       conj(World& world,
            const std::vector< Function<T,NDIM> >& v,
            bool fence=true){
       PROFILE_BLOCK(Vconj);
       std::vector< Function<T,NDIM> > conjugated = copy(world, v); // Currently don't have oop conj

       const std::size_t count = v.size();
       for (std::size_t k = 0; k != count; ++k) {
         conjugated[k].conj(false);
       }

       if (fence) {
         world.gop.fence();
       }
       return conjugated;
     }


     /// Return a copy of every function in \c v.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param v      Functions to copy.
     /// \param fence  If true, issue one global fence after all copies have
     ///               been started.
     /// \return Vector of the same length as \c v holding the copies.
     template <typename T, std::size_t NDIM>
       std::vector< Function<T,NDIM> >
       copy(World& world,
            const std::vector< Function<T,NDIM> >& v,
            bool fence=true) {
       PROFILE_BLOCK(Vcopy);
       const std::size_t count = v.size();
       std::vector< Function<T,NDIM> > copies(count);

       // Each single-function copy is started without a fence.
       for (std::size_t k = 0; k != count; ++k) {
         copies[k] = copy(v[k], false);
       }

       if (fence) {
         world.gop.fence();
       }
       return copies;
     }


     /// Return \c n independent copies of the single function \c v.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param v      Function to replicate.
     /// \param n      Number of copies to make.
     /// \param fence  If true, issue one global fence after all copies have
     ///               been started.
     /// \return Vector of \c n copies of \c v.
     template <typename T, std::size_t NDIM>
       std::vector< Function<T,NDIM> >
       copy(World& world,
            const Function<T,NDIM>& v,
            const unsigned int n,
            bool fence=true) {
       PROFILE_BLOCK(Vcopy1);
       typedef typename std::vector< Function<T,NDIM> >::iterator iterT;

       std::vector< Function<T,NDIM> > copies(n);
       // Each single-function copy is started without a fence.
       for (iterT it = copies.begin(); it != copies.end(); ++it) {
         *it = copy(v, false);
       }

       if (fence) {
         world.gop.fence();
       }
       return copies;
     }


     /// Element-wise sum of two vectors of functions:
     /// \c r[j] = add(a[j], b[j], false).
     ///
     /// Both inputs are compressed first via compress(world, ., blk).
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param a      Left operands.
     /// \param b      Right operands; must have the same length as \c a.
     /// \param fence  If true, fence after each block (when blk != 1) and once
     ///               more after the loop.
     /// \param blk    Number of functions per block; must be non-zero.
     /// \return Vector of \c a.size() sums.
     template <typename T, typename R, std::size_t NDIM>
       std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >
       add(World& world,
           const std::vector< Function<T,NDIM> >& a,
           const std::vector< Function<R,NDIM> >& b,
           bool fence=true,
           unsigned int blk=1) {
       PROFILE_BLOCK(Vadd);
       MADNESS_ASSERT(a.size() == b.size());
       compress(world, a, blk);
       compress(world, b, blk);

       std::vector< Function<TENSOR_RESULT_TYPE(T,R),NDIM> > r(a.size());

       unsigned int vvsize = a.size();
       for (unsigned int i=0; i<vvsize; i+= blk) {
         // Block is [i, i+blk). The old bound (i+1)*blk overlapped later
         // blocks, so sums were started more than once.
         const unsigned int jend = std::min(vvsize, i+blk);
         for (unsigned int j=i; j<jend; ++j)
           r[j] = add(a[j], b[j], false);
         if (fence && (blk !=1 )) world.gop.fence();
       }
       if (fence) world.gop.fence();

       return r;
     }


     /// Add the single function \c a to every function in \c b:
     /// \c r[j] = add(a, b[j], false).
     ///
     /// \c a and \c b are compressed first.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param a      Function added to every entry.
     /// \param b      Functions to which \c a is added.
     /// \param fence  If true, fence after each block (when blk != 1) and once
     ///               more after the loop.
     /// \param blk    Number of functions per block; must be non-zero.
     /// \return Vector of \c b.size() sums.
     template <typename T, typename R, std::size_t NDIM>
       std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >
       add(World& world,
           const Function<T,NDIM> & a,
           const std::vector< Function<R,NDIM> >& b,
            bool fence=true,
           unsigned int blk=1) {

       PROFILE_BLOCK(Vadd1);
       a.compress();
       compress(world, b, blk);

       std::vector< Function<TENSOR_RESULT_TYPE(T,R),NDIM> > r(b.size());

       unsigned int vvsize = b.size();
       for (unsigned int i=0; i<vvsize; i+= blk) {
         // Block is [i, i+blk). The old bound (i+1)*blk overlapped later
         // blocks, so sums were started more than once.
         const unsigned int jend = std::min(vvsize, i+blk);
         for (unsigned int j=i; j<jend; ++j)
           r[j] = add(a, b[j], false);
         if (fence && (blk !=1 )) world.gop.fence();
       }
       if (fence) world.gop.fence();

       return r;
     }


     /// Convenience overload with the operands in the opposite order: adds the
     /// single function \c a to every function in \c b by forwarding to
     /// add(world, a, b, fence, blk).
     ///
     /// \param world  World forwarded to the underlying add().
     /// \param b      Functions to which \c a is added.
     /// \param a      Function added to every entry.
     /// \param fence  Forwarded unchanged.
     /// \param blk    Forwarded unchanged.
     /// \return Result of add(world, a, b, fence, blk).
     template <typename T, typename R, std::size_t NDIM>
       inline std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >
       add(World& world,
           const std::vector< Function<R,NDIM> >& b,
           const Function<T,NDIM> & a,
            bool fence=true,
           unsigned int blk=1)
       {
         // Swap the operands back into (function, vector) order.
         return add(world, a, b, fence, blk);
       }


     /// Element-wise difference of two vectors of functions:
     /// \c r[j] = sub(a[j], b[j], false).
     ///
     /// Both inputs are compressed first via compress(world, ., blk).
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param a      Left operands.
     /// \param b      Right operands; must have the same length as \c a.
     /// \param fence  If true, fence after each block (when blk != 1) and once
     ///               more after the loop.
     /// \param blk    Number of functions per block; must be non-zero.
     /// \return Vector of \c a.size() differences.
     template <typename T, typename R, std::size_t NDIM>
       std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >
       sub(World& world,
            const std::vector< Function<T,NDIM> >& a,
            const std::vector< Function<R,NDIM> >& b,
            bool fence=true,
            unsigned int blk=1) {
       PROFILE_BLOCK(Vsub);
       MADNESS_ASSERT(a.size() == b.size());
       // compress() takes (world, v, blk, fence). The previous calls passed
       // (fence, blk), so fence==false became a block size of 0 and the block
       // loop never advanced. Always fence here, as the vector add() does.
       compress(world, a, blk);
       compress(world, b, blk);

       std::vector< Function<TENSOR_RESULT_TYPE(T,R),NDIM> > r(a.size());

       unsigned int vvsize = a.size();
       for (unsigned int i=0; i<vvsize; i+= blk) {
         // Block is [i, i+blk); (i+1)*blk made blocks overlap for blk>1.
         const unsigned int jend = std::min(vvsize, i+blk);
         for (unsigned int j=i; j<jend; ++j)
           r[j] = sub(a[j], b[j], false);
         if (fence && (blk !=1 )) world.gop.fence();
       }
       if (fence) world.gop.fence();
       return r;
     }


     /// Generalized A*X+Y for vectors of functions, in place on \c a:
     /// \c a[j].gaxpy(alpha, b[j], beta, false), i.e.
     /// a[j] = alpha*a[j] + beta*b[j].
     ///
     /// Both vectors are compressed first via compress(world, ., blk).
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param alpha  Coefficient applied to \c a[j].
     /// \param a      Functions updated in place.
     /// \param beta   Coefficient applied to \c b[j].
     /// \param b      Functions added in; must have the same length as \c a.
     /// \param blk    Number of functions per block; must be non-zero.
     /// \param fence  If true, fence after each block (when blk != 1) and once
     ///               more after the loop.
     template <typename T, typename Q, typename R, std::size_t NDIM>
       void gaxpy(World& world,
                  Q alpha,
                  std::vector< Function<T,NDIM> >& a,
                  Q beta,
                  const std::vector< Function<R,NDIM> >& b,
                  unsigned int blk=1,
                  bool fence=true) {
       PROFILE_BLOCK(Vgaxpy);
       MADNESS_ASSERT(a.size() == b.size());
       // compress() takes (world, v, blk, fence). The previous calls passed
       // (fence, blk), so fence==false became a block size of 0 and the block
       // loop never advanced. The operands must be compressed before use, so
       // always fence here.
       compress(world, a, blk);
       compress(world, b, blk);

       unsigned int vvsize = a.size();

       for (unsigned int i=0; i<vvsize; i+= blk) {
         // Block is [i, i+blk). The old bound (i+1)*blk overlapped later
         // blocks, so the update was applied to some a[j] more than once.
         const unsigned int jend = std::min(vvsize, i+blk);
         for (unsigned int j=i; j<jend; ++j)
           a[j].gaxpy(alpha, b[j], beta, false);

         if (fence && (blk !=1 )) world.gop.fence();
       }
       if (fence) world.gop.fence();
     }


     /// Apply a vector of operators to a vector of functions, one operator per
     /// function: \c result[j] = apply_only(*op[j], f[j], false).
     ///
     /// The inputs are reconstructed and put into non-standard form, the
     /// operators are applied block by block, the inputs are returned to
     /// standard form, and the results are reconstructed.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param op     Operators; must have the same length as \c f.
     /// \param f      Input functions.
     /// \param blk    Number of functions per block; must be non-zero.
     /// \return Vector of \c f.size() results.
     template <typename opT, typename R, std::size_t NDIM>
       std::vector< Function<TENSOR_RESULT_TYPE(typename opT::opT,R), NDIM> >
       apply(World& world,
             const std::vector< std::shared_ptr<opT> >& op,
             const std::vector< Function<R,NDIM> > f,
             const unsigned int blk=1){

       PROFILE_BLOCK(Vapplyv);
       MADNESS_ASSERT(f.size()==op.size());

       // Non-const view of f, needed because nonstandard()/standard() take a
       // non-const vector.
       std::vector< Function<R,NDIM> >& ncf = *const_cast< std::vector< Function<R,NDIM> >* >(&f);

       reconstruct(world, f, blk);
       nonstandard(world, ncf, blk);

       std::vector< Function<TENSOR_RESULT_TYPE(typename opT::opT,R), NDIM> > result(f.size());
       unsigned int ff = f.size();

       // Advance the block start i by blk. The previous loop incremented the
       // const block size (++blk) instead, so i never moved.
       for (unsigned int i=0; i<ff; i += blk) {
         // Block is [i, i+blk); (i+1)*blk would overlap later blocks.
         const unsigned int jend = std::min(ff, i+blk);
         for (unsigned int j=i; j<jend; ++j)
           result[j] = apply_only(*op[j], f[j], false);
         if (blk !=1)
           world.gop.fence();
       }

       world.gop.fence();

       // Pass blk explicitly: standard(world, ncf, false) bound false to the
       // block size (0) and left fence at its default.
       standard(world, ncf, blk, false);  // restores promise of logical constness
       world.gop.fence();
       reconstruct(world, result, blk);

       return result;
     }


     /// Apply one separated convolution operator to every function in \c f:
     /// \c result[j] = apply_only(op, f[j], false).
     ///
     /// The inputs are reconstructed and put into non-standard form, the
     /// operator is applied block by block, the inputs are returned to
     /// standard form, and the results are reconstructed.
     ///
     /// \param world  World whose \c gop.fence() is used for synchronisation.
     /// \param op     Operator applied to every function.
     /// \param f      Input functions.
     /// \param blk    Number of functions per block; must be non-zero.
     /// \return Vector of \c f.size() results.
     template <typename T, typename R, std::size_t NDIM>
       std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> >
       apply(World& world,
             const SeparatedConvolution<T,NDIM>& op,
             const std::vector< Function<R,NDIM> > f,
             const unsigned int blk=1) {
       PROFILE_BLOCK(Vapply);

       // Non-const view of f, needed because nonstandard()/standard() take a
       // non-const vector.
       std::vector< Function<R,NDIM> >& ncf = *const_cast< std::vector< Function<R,NDIM> >* >(&f);

       reconstruct(world, f, blk);
       nonstandard(world, ncf, blk);

       std::vector< Function<TENSOR_RESULT_TYPE(T,R), NDIM> > result(f.size());

       unsigned int ff = f.size();
       // Advance the block start i by blk. The previous loop incremented the
       // const block size (++blk) instead, so i never moved.
       for (unsigned int i=0; i<ff; i += blk) {
         // Block is [i, i+blk); (i+1)*blk would overlap later blocks.
         const unsigned int jend = std::min(ff, i+blk);
         for (unsigned int j=i; j<jend; ++j)
           result[j] = apply_only(op, f[j], false);
         if (blk !=1)
           world.gop.fence();
       }
       world.gop.fence();

       standard(world, ncf, blk, false);  // restores promise of logical constness
       world.gop.fence();
       reconstruct(world, result, blk);

       return result;
     }


     /// Normalize every function in \c v in place by scaling it with the
     /// reciprocal of its norm as returned by norm2s(world, v).
     ///
     /// \param world  World used by norm2s() and for the optional fence.
     /// \param v      Functions to normalize in place.
     /// \param fence  If true, issue one global fence after the scaling loop.
     template <typename T, std::size_t NDIM>
       void normalize(World& world,
                      std::vector< Function<T,NDIM> >& v,
                      bool fence=true){

       PROFILE_BLOCK(Vnormalize);
       const std::vector<double> norms = norm2s(world, v);

       // Each scale is started without a fence; the optional fence comes after.
       for (std::size_t k = 0; k < v.size(); ++k) {
         const double inverse_norm = 1.0/norms[k];
         v[k].scale(inverse_norm,false);
       }

       if (fence) {
         world.gop.fence();
       }
     }


 }

 #endif // MADNESS_MRA_VMRA_H__INCLUDED

madness::matrix_inner
void matrix_inner(DistributedMatrix< T > &A, const std::vector< Function< T, NDIM > > &f, const std::vector< Function< T, NDIM > > &g, bool sym=false)
Definition: chem/distpm.cc:38

madness::World::gop
WorldGopInterface & gop
Global operations.
Definition: worldfwd.h:462

madness::MatrixInnerTask::jtop
long jtop
Definition: vmra1.h:468

madness::tr1::shptr::shared_ptr
Definition: shared_ptr_bits.h:38

madness::reconstruct
void reconstruct(World &world, const std::vector< Function< T, NDIM > > &v, bool fence=true)
Reconstruct a vector of functions.
Definition: vmra.h:149

R
const double R
Definition: dielectric.cc:191

mra.h
Main include file for MADNESS and defines Function interface.

madness::gaxpy
void gaxpy(World &world, Q alpha, std::vector< Function< T, NDIM > > &a, Q beta, const std::vector< Function< R, NDIM > > &b, bool fence=true)
Generalized A*X+Y for vectors of functions: a[i] = alpha*a[i] + beta*b[i].
Definition: vmra.h:680

madness::MatrixInnerTask::run
void run(World &world)
Runs a single-threaded task ... derived classes must implement this.
Definition: vmra1.h:476

madness::Function::compress
const Function< T, NDIM > & compress(bool fence=true) const
Compresses the function, transforming into wavelet basis. Possible non-blocking comm.
Definition: mra.h:683

madness::Derivative
Implements derivatives operators with variety of boundary conditions on simulation domain...
Definition: derivative.h:272

madness::truncate
void truncate(World &world, std::vector< Function< T, NDIM > > &v, double tol=0.0, bool fence=true)
Truncates a vector of functions.
Definition: vmra.h:194

madness::SeparatedConvolution< T, NDIM >

madness::nonstandard
void nonstandard(World &world, std::vector< Function< T, NDIM > > &v, bool fence=true)
Generates non-standard form of a vector of functions.
Definition: vmra.h:167

madness::f
NDIM & f
Definition: mra.h:2179

madness::apply_only
Function< TENSOR_RESULT_TYPE(typename opT::opT, R), NDIM > apply_only(const opT &op, const Function< R, NDIM > &f, bool fence=true)
Apply operator ONLY in non-standard form - required other steps missing !!
Definition: mra.h:1942

derivative.h
Declaration and initialization of tree traversal functions and generic derivative.

madness::add
Function< TENSOR_RESULT_TYPE(L, R), NDIM > add(const Function< L, NDIM > &left, const Function< R, NDIM > &right, bool fence=true)
Same as operator+ but with optional fence and no automatic compression.
Definition: mra.h:1734

madness::TENSOR_RESULT_TYPE
TENSOR_RESULT_TYPE(T, R) inner(const Function<T
Computes the scalar/inner product between two functions.

madness::norm_tree
void norm_tree(World &world, const std::vector< Function< T, NDIM > > &v, bool fence=true)
Makes the norm tree for all functions in a vector.
Definition: vmra.h:506

beta
const double beta
Definition: gygi_soltion.cc:63

madness::inner
T inner(const vecfunc< T, NDIM > &a, const vecfunc< T, NDIM > &b)
the non-linear solver requires an inner product
Definition: nemo.h:112

madness::norm2s
std::vector< double > norm2s(World &world, const std::vector< Function< T, NDIM > > &v)
Computes the 2-norms of a vector of functions.
Definition: vmra.h:312

madness::MatrixInnerTask
Definition: vmra1.h:464

PROFILE_BLOCK
#define PROFILE_BLOCK(name)
Definition: worldprofile.h:197

std::tr1::T
const T1 &f1 return GTEST_2_TUPLE_() T(f0, f1)

madness::scale
void scale(World &world, std::vector< Function< T, NDIM > > &v, const std::vector< Q > &factors, bool fence=true)
Scales inplace a vector of functions by distinct values.
Definition: vmra.h:290

madness::Function::reconstruct
void reconstruct(bool fence=true) const
Reconstructs the function, transforming into scaling function basis. Possible non-blocking comm...
Definition: mra.h:737

madness::copy
Function< T, NDIM > copy(const Function< T, NDIM > &f, const std::shared_ptr< WorldDCPmapInterface< Key< NDIM > > > &pmap, bool fence=true)
Create a new copy of the function with different distribution and optional fence. ...
Definition: mra.h:1835

mpfr::min
const mpreal min(const mpreal &x, const mpreal &y)
Definition: mpreal.h:2675

madness::sub
Function< TENSOR_RESULT_TYPE(L, R), NDIM > sub(const Function< L, NDIM > &left, const Function< R, NDIM > &right, bool fence=true)
Same as operator- but with optional fence and no automatic compression.
Definition: mra.h:1778

a
FLOAT a(int j, FLOAT z)
Definition: y1.cc:86

madness::vmulXX
std::vector< Function< TENSOR_RESULT_TYPE(L, R), D > > vmulXX(const Function< L, D > &left, const std::vector< Function< R, D > > &vright, double tol, bool fence=true)
Use the vmra/mul(...) interface instead.
Definition: mra.h:1634

madness::MatrixInnerTask::MatrixInnerTask
MatrixInnerTask(const Tensor< TENSOR_RESULT_TYPE(T, R)> &result, const Function< T, NDIM > &f, const std::vector< Function< R, NDIM > > &g, long jtop)
Definition: vmra1.h:470

madness::set_thresh
void set_thresh(World &world, std::vector< Function< T, NDIM > > &v, double thresh, bool fence=true)
Sets the threshold in a vector of functions.
Definition: vmra.h:556

madness::WorldGopInterface::sum
void sum(T *buf, size_t nelem)
Inplace global sum while still processing AM & tasks.
Definition: worldgop.h:767

madness::standard
void standard(World &world, std::vector< Function< T, NDIM > > &v, bool fence=true)
Generates standard form of a vector of functions.
Definition: vmra.h:181

sqrt
tensorT sqrt(const tensorT &s, double tol=1e-8)
Computes matrix square root (not used any more?)
Definition: DFcode/moldft.cc:446

madness::square
Function< T, NDIM > square(const Function< T, NDIM > &f, bool fence=true)
Create a new function that is the square of f - global comm only if not reconstructed.
Definition: mra.h:1806

madness::World
A parallel world with full functionality wrapping an MPI communicator.
Definition: worldfwd.h:416

madness::WorldGopInterface::fence
void fence()
Synchronizes all processes in communicator AND globally ensures no pending AM or tasks.
Definition: worldgop.cc:52

madness::norm2
double norm2(World &world, const std::vector< Function< T, NDIM > > &v)
Computes the 2-norm of a vector of functions.
Definition: vmra.h:325

madness::Function
A multiresolution adaptive numerical function.
Definition: derivative.h:61

madness::MatrixInnerTask::g
const std::vector< Function< R, NDIM > > & g
Definition: vmra1.h:467

m
const double m
Definition: gfit.cc:199

madness::Function::fence
impl->world.gop.fence()

madness::mul_sparse
Function< TENSOR_RESULT_TYPE(L, R), NDIM > mul_sparse(const Function< L, NDIM > &left, const Function< R, NDIM > &right, double tol, bool fence=true)
Sparse multiplication — left and right must be reconstructed and if tol!=0 have tree of norms already created.
Definition: mra.h:1569

madness::PoolTaskInterface::make_id
static enable_if_c< detail::function_traits< fnT >::value||detail::memfunc_traits< fnT >::value >::type make_id(std::pair< void *, unsigned short > &id, fnT fn)
Definition: worldthread.h:680

madness::Function::size
std::size_t size() const
Returns the number of coefficients in the function ... collective global sum.
Definition: mra.h:515

op
Tensor< double > op(const Tensor< double > &x)
Definition: kain.cc:508

madness::MatrixInnerTask::f
const Function< T, NDIM > & f
Definition: vmra1.h:466

madness::Function::norm_tree
void norm_tree(bool fence=true) const
Initializes information about the function norm at all length scales.
Definition: mra.h:663

madness::TaskInterface
All world tasks must be derived from this public interface.
Definition: taskfn.h:68

madness::FunctionFactory
FunctionFactory implements the named-parameter idiom for Function.
Definition: funcimpl.h:70

madness::MatrixInnerTask::result
Tensor< TENSOR_RESULT_TYPE(T, R)> result
Definition: vmra1.h:465

madness
Holds machinery to set up Functions/FuncImpls using various Factories and Interfaces.
Definition: chem/atomutil.cc:45

madness::apply
Function< T, NDIM > apply(const Derivative< T, NDIM > &D, const Function< T, NDIM > &f, bool fence=true)
Applies derivative operator to function (for syntactic equivalence to integral operator apply).
Definition: derivative.h:613

c
const double c
Definition: gfit.cc:200

madness::transform
std::vector< Function< TENSOR_RESULT_TYPE(T, R), NDIM > > transform(World &world, const std::vector< Function< T, NDIM > > &v, const DistributedMatrix< R > &c, bool fence=true)
Definition: chem/SCF.cc:86

b
FLOAT b(int j, FLOAT z)
Definition: y1.cc:79

madness::normalize
void normalize(World &world, std::vector< Function< T, NDIM > > &v, bool fence=true)
Normalizes a vector of functions — v[i] = v[i].scale(1.0/v[i].norm2())
Definition: vmra.h:765

madness::zero_functions
std::vector< Function< T, NDIM > > zero_functions(World &world, int n)
Generates a vector of zero functions.
Definition: vmra.h:229

madness::mul
Function< TENSOR_RESULT_TYPE(Q, T), NDIM > mul(const Q alpha, const Function< T, NDIM > &f, bool fence=true)
Returns new function equal to alpha*f(x) with optional fence.
Definition: mra.h:1528

madness::conj
Function< T, NDIM > conj(const Function< T, NDIM > &f, bool fence=true)
Return the complex conjugate of the input function with the same distribution and optional fence.
Definition: mra.h:1879

madness::compress
void compress(World &world, const std::vector< Function< T, NDIM > > &v, bool fence=true)
Compress a vector of functions.
Definition: vmra.h:130