madness/mraimpl_8h_source.html

 /*

   This file is part of MADNESS.


   Copyright (C) 2007,2010 Oak Ridge National Laboratory


   This program is free software; you can redistribute it and/or modify

   it under the terms of the GNU General Public License as published by

   the Free Software Foundation; either version 2 of the License, or

   (at your option) any later version.


   This program is distributed in the hope that it will be useful,

   but WITHOUT ANY WARRANTY; without even the implied warranty of

   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

   GNU General Public License for more details.


   You should have received a copy of the GNU General Public License

   along with this program; if not, write to the Free Software

   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA


   For more information please contact:


   Robert J. Harrison

   Oak Ridge National Laboratory

   One Bethel Valley Road

   P.O. Box 2008, MS-6367


   email: harrisonrj@ornl.gov

   tel:   865-241-3937

   fax:   865-572-0680


   $Id$

 */


 #ifndef MADNESS_MRA_MRAIMPL_H__INCLUDED

 #define MADNESS_MRA_MRAIMPL_H__INCLUDED


 #ifndef MPRAIMPLX

 #error "mraimpl.h should ONLY be included in one of the mraX.cc files (x=1..6)"

 #endif


 //#define WORLD_INSTANTIATE_STATIC_TEMPLATES

 #include <math.h>

 #include <madness/world/worldobj.h>

 #include <madness/world/worlddc.h>

 #include <madness/world/worldhashmap.h>

 #include <madness/mra/function_common_data.h>


 #include <madness/mra/funcimpl.h>

 #include <madness/mra/displacements.h>


 namespace madness {


     // Definition and initialization of FunctionDefaults static members

     // It cannot be an instance of FunctionFactory since we want to

     // set the defaults independent of the data type.


     /// Loads the two-scale filter for order \c k and caches its sub-blocks.
     ///
     /// two_scale_hg() fills \c hg; this routine then stores contiguous copies of
     /// the transposed filter, of its first \c k rows, of the four blocks obtained
     /// by splitting rows and columns at index \c k, and of each block's transpose.
     /// A C string is thrown if two_scale_hg() reports failure.
     template <typename T, std::size_t NDIM>
     void FunctionCommonData<T,NDIM>::_init_twoscale() {
         const bool have_filter = two_scale_hg(k, &hg);
         if (!have_filter) throw "failed to get twoscale coefficients";

         Slice lower(0,k-1);   // indices 0 .. k-1
         Slice upper(k,-1);    // indices k .. last

         hgT = copy(transpose(hg));
         hgsonly = copy(hg(lower,_));

         // The four blocks of the filter ...
         h0 = copy(hg(lower,lower));
         h1 = copy(hg(lower,upper));
         g0 = copy(hg(upper,lower));
         g1 = copy(hg(upper,upper));

         // ... and their transposes
         h0T = copy(transpose(hg(lower,lower)));
         h1T = copy(transpose(hg(lower,upper)));
         g0T = copy(transpose(hg(upper,lower)));
         g1T = copy(transpose(hg(upper,upper)));
     }


     /// Builds the Gauss-Legendre quadrature tables.
     ///
     /// \param[in]  k         number of scaling functions tabulated per point (at most 200)
     /// \param[in]  npt       number of quadrature points
     /// \param[out] quad_x    quadrature points from gauss_legendre() on (0,1), length \c npt
     /// \param[out] quad_w    matching quadrature weights, length \c npt
     /// \param[out] quad_phi  quad_phi(mu,j) = j-th scaling function at point mu
     /// \param[out] quad_phiw quad_phiw(mu,j) = quad_w(mu) * quad_phi(mu,j)
     /// \param[out] quad_phit transpose of \c quad_phi
     template <typename T, std::size_t NDIM>
     void FunctionCommonData<T,NDIM>::_init_quadrature
     (int k, int npt, Tensor<double>& quad_x, Tensor<double>& quad_w,
      Tensor<double>& quad_phi, Tensor<double>& quad_phiw, Tensor<double>& quad_phit) {
         // The per-point scratch buffer below lives on the stack and has a fixed
         // size; refuse orders that would run past its end.
         const int max_k = 200;
         MADNESS_ASSERT(k <= max_k);

         quad_x = Tensor<double>(npt);
         quad_w = Tensor<double>(npt);
         quad_phi = Tensor<double>(npt,k);
         quad_phiw = Tensor<double>(npt,k);

         gauss_legendre(npt,0.0,1.0,quad_x.ptr(),quad_w.ptr());
         for (int mu=0; mu<npt; ++mu) {
             double phi[max_k];
             legendre_scaling_functions(quad_x(mu),k,phi);
             for (int j=0; j<k; ++j) {
                 quad_phi(mu,j) = phi[j];
                 quad_phiw(mu,j) = quad_w(mu)*phi[j];
             }
         }
         quad_phit = transpose(quad_phi);
     }


     /// Checks the locally stored tree nodes for structural consistency.
     ///
     /// Two passes over the local container are made between global fences:
     /// first every node's coefficients are compared against what the compression
     /// state and the has_children() flag allow, then the parent/child links of
     /// every node are checked. The first violation found is printed and raised
     /// through MADNESS_EXCEPTION.
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::verify_tree() const {
         PROFILE_MEMBER_FUNC(FunctionImpl);
         world.gop.fence();  // Make sure nothing is going on

         // Pass 1: compression status vs. existence and size of coefficients
         for (typename dcT::const_iterator entry=coeffs.begin(); entry!=coeffs.end(); ++entry) {
             const keyT& key = entry->first;
             const nodeT& node = entry->second;

             // Coefficients are tolerated on interior nodes of a compressed tree
             // and on leaf nodes of a reconstructed tree; anywhere else any data
             // at all is an error.
             const bool may_hold_coeffs = (is_compressed() == node.has_children());

             bool inconsistent = node.coeff().has_data();
             if (inconsistent && may_hold_coeffs) {
                 // Where data is allowed its leading dimension must match
                 if (is_compressed()) inconsistent = (node.coeff().dim(0) != 2*cdata.k);
                 else                 inconsistent = (node.coeff().dim(0) != cdata.k);
             }
             if (!inconsistent) continue;

             print(world.rank(), "FunctionImpl: verify: INCONSISTENT TREE NODE, key =", key, ", node =", node,
                   ", dim[0] =",node.coeff().dim(0),", compressed =",is_compressed());
             std::cout.flush();
             MADNESS_EXCEPTION("FunctionImpl: verify: INCONSISTENT TREE NODE", 0);
         }

         // Pass 2: parents and children must exist exactly where the flags say so
         for (typename dcT::const_iterator entry=coeffs.begin(); entry!=coeffs.end(); ++entry) {
             const keyT& key = entry->first;
             const nodeT& node = entry->second;

             // Every node below the root needs a parent that admits to having children
             if (key.level() > 0) {
                 const keyT parent = key.parent();
                 typename dcT::const_iterator parent_it = coeffs.find(parent).get();
                 if (parent_it == coeffs.end()) {
                     print(world.rank(), "FunctionImpl: verify: MISSING PARENT",key,parent);
                     std::cout.flush();
                     MADNESS_EXCEPTION("FunctionImpl: verify: MISSING PARENT", 0);
                 }
                 if (!parent_it->second.has_children()) {
                     print(world.rank(), "FunctionImpl: verify: PARENT THINKS IT HAS NO CHILDREN",key,parent);
                     std::cout.flush();
                     MADNESS_EXCEPTION("FunctionImpl: verify: PARENT THINKS IT HAS NO CHILDREN", 0);
                 }
             }

             // Each potential child must be present iff this node claims children
             for (KeyChildIterator<NDIM> kit(key); kit; ++kit) {
                 typename dcT::const_iterator child_it = coeffs.find(kit.key()).get();
                 const bool child_present = !(child_it == coeffs.end());
                 if (child_present == node.has_children()) continue;

                 if (child_present) {
                     print(world.rank(), "FunctionImpl: verify: UNEXPECTED CHILD",key,kit.key());
                     std::cout.flush();
                     MADNESS_EXCEPTION("FunctionImpl: verify: UNEXPECTED CHILD", 0);
                 }
                 else {
                     print(world.rank(), "FunctionImpl: verify: MISSING CHILD",key,kit.key());
                     std::cout.flush();
                     MADNESS_EXCEPTION("FunctionImpl: verify: MISSING CHILD", 0);
                 }
             }
         }

         world.gop.fence();
     }


     /// Returns the process map used by the coefficient container.
     template <typename T, std::size_t NDIM>
     const std::shared_ptr< WorldDCPmapInterface< Key<NDIM> > >& FunctionImpl<T,NDIM>::get_pmap() const {
         // Simply forwarded from the container; no copy of the pointer is made here
         return this->coeffs.get_pmap();
     }


     /// Out-of-place gaxpy on reconstructed trees, with the result stored in this tree.
     ///
     /// \param[in] alpha factor handed to add_op together with \c f
     /// \param[in] f     first input; must not be compressed
     /// \param[in] beta  factor handed to add_op together with \c g
     /// \param[in] g     second input; must not be compressed
     /// \param[in] fence if true, a global fence is executed before returning
     ///
     /// Only the owner of the root key launches the traversal task; every process
     /// marks this tree as not compressed.
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::gaxpy_oop_reconstructed(const double alpha, const implT& f,
                                                        const double beta, const implT& g, const bool fence) {
         MADNESS_ASSERT(not f.is_compressed());
         MADNESS_ASSERT(not g.is_compressed());

         typedef add_op coeff_opT;            // produces the combined coefficients
         typedef insert_op<T,NDIM> apply_opT; // inserts them into this tree

         const ProcessID root_owner = coeffs.owner(cdata.key0);
         if (root_owner == world.rank()) {
             CoeffTracker<T,NDIM> f_tracker(&f);
             CoeffTracker<T,NDIM> g_tracker(&g);
             coeff_opT coeff_op(f_tracker,g_tracker,alpha,beta);
             apply_opT apply_op(this);

             // Start the traversal at the root key as a local task
             woT::task(world.rank(), &implT:: template forward_traverse<coeff_opT,apply_opT>,
                       coeff_op, apply_op, cdata.key0);
         }

         this->compressed=false;
         if (fence) world.gop.fence();
     }


     /// Reports the value of the \c compressed flag.
     template <typename T, std::size_t NDIM>
     bool FunctionImpl<T,NDIM>::is_compressed() const {
         return this->compressed;
     }


     /// Reports the value of the \c redundant flag.
     template <typename T, std::size_t NDIM>
     bool FunctionImpl<T,NDIM>::is_redundant() const {
         return this->redundant;
     }


     /// Reports the value of the \c nonstandard flag.
     template <typename T, std::size_t NDIM>
     bool FunctionImpl<T,NDIM>::is_nonstandard() const {
         return this->nonstandard;
     }


     /// Installs \c functor1 as this function's functor and switches on the on-demand flag.
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::set_functor(const std::shared_ptr<FunctionFunctorInterface<T,NDIM> > functor1) {
         this->functor = functor1;
         this->on_demand = true;
     }


     /// Returns the stored functor; asserts that one has been set.
     template <typename T, std::size_t NDIM>
     std::shared_ptr<FunctionFunctorInterface<T,NDIM> > FunctionImpl<T,NDIM>::get_functor() {
         MADNESS_ASSERT(this->functor);
         return this->functor;
     }


     /// Const overload: returns the stored functor; asserts that one has been set.
     template <typename T, std::size_t NDIM>
     std::shared_ptr<FunctionFunctorInterface<T,NDIM> > FunctionImpl<T,NDIM>::get_functor() const {
         MADNESS_ASSERT(this->functor);
         return this->functor;
     }


     /// Drops the stored functor and switches off the on-demand flag.
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::unset_functor() {
         this->functor.reset();
         this->on_demand = false;
     }


     /// Gives writable access to the on-demand flag.
     template <typename T, std::size_t NDIM>
     bool& FunctionImpl<T,NDIM>::is_on_demand() {
         return this->on_demand;
     }


     /// Gives read-only access to the on-demand flag.
     template <typename T, std::size_t NDIM>
     const bool& FunctionImpl<T,NDIM>::is_on_demand() const {
         return this->on_demand;
     }


     /// Returns the tensor type recorded in the tensor arguments (\c targs.tt).
     template <typename T, std::size_t NDIM>
     TensorType FunctionImpl<T,NDIM>::get_tensor_type() const {
         return this->targs.tt;
     }


     /// Returns a copy of the tensor arguments \c targs.
     template <typename T, std::size_t NDIM>
     TensorArgs FunctionImpl<T,NDIM>::get_tensor_args() const {
         return this->targs;
     }


     /// Returns the current threshold \c thresh.
     template <typename T, std::size_t NDIM>
     double FunctionImpl<T,NDIM>::get_thresh() const {
         return this->thresh;
     }


     /// Overwrites the threshold \c thresh with \c value.
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::set_thresh(double value) {
         this->thresh = value;
     }


     /// Returns the \c autorefine flag.
     template <typename T, std::size_t NDIM>
     bool FunctionImpl<T,NDIM>::get_autorefine() const {
         return this->autorefine;
     }


     /// Overwrites the \c autorefine flag with \c value.
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::set_autorefine(bool value) {
         this->autorefine = value;
     }


     /// Returns the member \c k.
     template <typename T, std::size_t NDIM>
     int FunctionImpl<T,NDIM>::get_k() const {
         return this->k;
     }


     /// Read-only access to the coefficient container.
     template <typename T, std::size_t NDIM>
     const typename FunctionImpl<T,NDIM>::dcT& FunctionImpl<T,NDIM>::get_coeffs() const {
         return this->coeffs;
     }


     /// Writable access to the coefficient container.
     template <typename T, std::size_t NDIM>
     typename FunctionImpl<T,NDIM>::dcT& FunctionImpl<T,NDIM>::get_coeffs() {
         return this->coeffs;
     }


     /// Read-only access to the common data object \c cdata.
     template <typename T, std::size_t NDIM>
     const FunctionCommonData<T,NDIM>& FunctionImpl<T,NDIM>::get_cdata() const {
         return this->cdata;
     }


     /// Adds \c time to the \c timer_accumulate timer.
     ///
     /// \return None
     template <typename T, std::size_t NDIM>
     Void FunctionImpl<T,NDIM>::accumulate_timer(const double time) const {
         this->timer_accumulate.accumulate(time);
         return None;
     }


     /// Prints the three internal timers; only rank 0 produces output.
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::print_timer() const {
         if (world.rank()!=0) return;

         timer_accumulate.print("accumulate");
         timer_target_driven.print("target_driven");
         timer_lr_result.print("result2low_rank");
     }


     /// Resets the three internal timers; only rank 0 does so.
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::reset_timer() {
         if (world.rank()!=0) return;

         timer_accumulate.reset();
         timer_target_driven.reset();
         timer_lr_result.reset();
     }


     /// Starts truncation of the tree from the root.
     ///
     /// \param[in] tol   truncation tolerance; values <= 0 select the stored \c thresh
     /// \param[in] fence if true, a global fence is executed before returning
     ///
     /// Only the owner of the root key spawns the work, using the compressed or
     /// the reconstructed variant according to is_compressed().
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::truncate(double tol, bool fence) {
         // The tolerance stays a local: storing it in the object would make a race condition
         double effective_tol = (tol <= 0.0) ? thresh : tol;

         const bool owns_root = (world.rank() == coeffs.owner(cdata.key0));
         if (owns_root) {
             if (is_compressed())
                 truncate_spawn(cdata.key0,effective_tol);
             else
                 truncate_reconstructed_spawn(cdata.key0,effective_tol);
         }

         if (fence) world.gop.fence();
     }


     /// Returns the root key stored in the common data (\c cdata.key0).
     template <typename T, std::size_t NDIM>
     const typename FunctionImpl<T,NDIM>::keyT& FunctionImpl<T,NDIM>::key0() const {
         return this->cdata.key0;
     }


     /// Writes a picture of the boxes intersecting a plane to \c filename.
     ///
     /// \param[in] filename output file, written by rank 0 only
     /// \param[in] xaxis    dimension index used as the horizontal plot axis
     /// \param[in] yaxis    dimension index used as the vertical plot axis
     /// \param[in] el2      point (user coordinates) passed on to print_plane_local()
     ///
     /// Every process collects its local boxes, the per-process tensors are
     /// concatenated with concat0(), and after a fence rank 0 does the printing.
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::print_plane(const std::string filename, const int xaxis, const int yaxis, const coordT& el2) {
         // One tensor per process, wrapped in a vector so it can be concatenated
         std::vector<Tensor<double> > local_boxes(1,print_plane_local(xaxis,yaxis,el2));
         std::vector<Tensor<double> > all_boxes=world.gop.concat0(local_boxes);
         world.gop.fence();

         if (world.rank()!=0) return;
         do_print_plane(filename,all_boxes,xaxis,yaxis,el2);
     }


     /// Collects plotting data for all local leaf boxes that intersect a plane.
     ///
     /// \param[in] xaxis dimension index used as the horizontal plot axis
     /// \param[in] yaxis dimension index used as the vertical plot axis
     /// \param[in] el2   point in user coordinates that selects the plane
     /// \return a tensor with one row per selected box and five columns
     ///         (hue, x lo left, y lo left, x hi right, y hi right) in user
     ///         coordinates, or an empty tensor if no box was selected
     ///
     /// Boxes that extend outside the hard-coded window [-5,5] x [-5,5] are skipped.
     template <typename T, std::size_t NDIM>
     Tensor<double> FunctionImpl<T,NDIM>::print_plane_local(const int xaxis, const int yaxis, const coordT& el2) {
         coordT x_sim;
         user_to_sim<NDIM>(el2,x_sim);
         // Tiny shift of the third coordinate (presumably to keep the point off a
         // box boundary). Only applied when a third coordinate exists; indexing
         // x_sim[2] for NDIM<3 would be out of bounds.
         if (NDIM > 2) x_sim[2]+=1.e-10;

         // dimensions are: (# boxes)(hue, x lo left, y lo left, x hi right, y hi right)
         Tensor<double> plotinfo(coeffs.size(),5);
         long counter=0;

         // loop over local boxes; if they fit, add the info to the output tensor
         typename dcT::const_iterator end = coeffs.end();
         for (typename dcT::const_iterator it=coeffs.begin(); it!=end; ++it) {
             const keyT& key = it->first;
             const nodeT& node = it->second;

             // thisKeyContains is told the two plot axes -- presumably it ignores
             // those dimensions when testing for containment
             if (key.thisKeyContains(x_sim,xaxis,yaxis) and node.is_leaf() and (node.has_coeff())) {

                 Level n=key.level();
                 Vector<Translation,NDIM> l=key.translation();
                 // get the diametral edges of the node in the plotting plane
                 double scale=std::pow(0.5,double(n));
                 double xloleft = scale*l[xaxis];
                 double yloleft = scale*l[yaxis];
                 double xhiright = scale*(l[xaxis]+1);
                 double yhiright = scale*(l[yaxis]+1);

                 // convert back to user coordinates
                 Vector<double,4> user;
                 user[0]=xloleft*FunctionDefaults<NDIM>::get_cell_width()[xaxis] + FunctionDefaults<NDIM>::get_cell()(xaxis,0);
                 user[2]=xhiright*FunctionDefaults<NDIM>::get_cell_width()[xaxis] + FunctionDefaults<NDIM>::get_cell()(xaxis,0);
                 user[1]=yloleft*FunctionDefaults<NDIM>::get_cell_width()[yaxis] + FunctionDefaults<NDIM>::get_cell()(yaxis,0);
                 user[3]=yhiright*FunctionDefaults<NDIM>::get_cell_width()[yaxis] + FunctionDefaults<NDIM>::get_cell()(yaxis,0);

                 // skip boxes reaching outside the fixed plot window
                 if ((user[0]<-5.0) or (user[1]<-5.0) or (user[2]>5.0) or (user[3]>5.0)) continue;

                 // do rank or do error; the error branch is currently disabled
                 double color=0.0;
                 if (1) {

                     const double maxrank=40;
                     do_convert_to_color hue(maxrank,false);
                     color=hue(node.coeff().rank());
                 } else {

                     // Make quadrature rule of higher order
                     const int npt = cdata.npt + 1;
                     Tensor<double> qx, qw, quad_phi, quad_phiw, quad_phit;
                     FunctionCommonData<T,NDIM>::_init_quadrature(k+1, npt, qx, qw, quad_phi, quad_phiw, quad_phit);
                     do_err_box< FunctionFunctorInterface<T,NDIM> > op(this, this->get_functor().get(), npt, qx, quad_phit, quad_phiw);

                     do_convert_to_color hue(1000.0,true);
                     double error=op(it);
                     error=sqrt(error);//*pow(2,key.level()*6);
                     color=hue(error);
                 }

                 plotinfo(counter,0)=color;
                 plotinfo(counter,1)=user[0];
                 plotinfo(counter,2)=user[1];
                 plotinfo(counter,3)=user[2];
                 plotinfo(counter,4)=user[3];
                 ++counter;
             }
         }

         // shrink the info to the rows actually filled
         if (counter==0) plotinfo=Tensor<double>();
         else plotinfo=plotinfo(Slice(0,counter-1),Slice(_));
         return plotinfo;
     }


     /// Writes the gathered box information as a PSTricks picture.
     ///
     /// \param[in] filename name of the file to (over)write
     /// \param[in] plotinfo one tensor per process; each row holds
     ///                     (hue, x lo left, y lo left, x hi right, y hi right)
     /// \param[in] xaxis    unused here
     /// \param[in] yaxis    unused here
     /// \param[in] el2      unused here
     /// \return None
     ///
     /// Must be called on rank 0 only. Raises a MADNESS exception if the file
     /// cannot be opened. The picture bounds are fixed to (-5,-5)(5,5).
     template <typename T, std::size_t NDIM>
     Void FunctionImpl<T,NDIM>::do_print_plane(const std::string filename, std::vector<Tensor<double> > plotinfo,
                                               const int xaxis, const int yaxis, const coordT el2) {

         // invoke only on master node
         MADNESS_ASSERT(world.rank()==0);

         // prepare file; bail out instead of writing through a null handle
         FILE * pFile = fopen(filename.c_str(), "w");
         if (!pFile) {
             print("FunctionImpl: do_print_plane: could not open file",filename);
             MADNESS_EXCEPTION("FunctionImpl: do_print_plane: could not open output file", 0);
         }

         fprintf(pFile,"\\psset{unit=1cm}\n");
         fprintf(pFile,"\\begin{pspicture}(%4.2f,%4.2f)(%4.2f,%4.2f)\n",
                 -5.0,-5.0,5.0,5.0);
         fprintf(pFile,"\\pslinewidth=0.1pt\n");

         for (std::vector<Tensor<double> >::const_iterator it=plotinfo.begin(); it!=plotinfo.end(); ++it) {

             Tensor<double> localinfo=*it;
             if (localinfo.has_data()) {

                 // one coloured frame per box
                 for (long i=0; i<localinfo.dim(0); ++i) {

                     fprintf(pFile,"\\newhsbcolor{mycolor}{%8.4f 1.0 0.7}\n",localinfo(i,0));
                     fprintf(pFile,"\\psframe["//linewidth=0.5pt,"
                             "fillstyle=solid,"
                             "fillcolor=mycolor]"
                             "(%12.8f,%12.8f)(%12.8f,%12.8f)\n",
                             localinfo(i,1),localinfo(i,2),localinfo(i,3),localinfo(i,4));
                 }
             }
         }

         fprintf(pFile,"\\end{pspicture}\n");
         fclose(pFile);

         return None;
     }


     /// Writes the quadrature grid of all leaf boxes to \c filename.
     ///
     /// Every process collects the keys of its local leaf boxes, the key lists are
     /// concatenated with concat0(), and after a fence rank 0 writes the file.
     template <typename T, std::size_t NDIM>
     void  FunctionImpl<T,NDIM>::print_grid(const std::string filename) const {
         // Local leaf keys of this process
         std::vector<keyT> my_leaves=local_leaf_keys();

         // Lump the keys of all processes together
         std::vector<keyT> gathered_leaves=world.gop.concat0(my_leaves);
         world.gop.fence();

         // Only rank 0 does the actual print
         if (world.rank()!=0) return;
         do_print_grid(filename,gathered_leaves);
     }


     /// Returns the keys of all locally stored nodes for which is_leaf() is true.
     ///
     /// The keys appear in the iteration order of the local container.
     template <typename T, std::size_t NDIM>
     std::vector<typename FunctionImpl<T,NDIM>::keyT>  FunctionImpl<T,NDIM>::local_leaf_keys() const {
         // coeffs.size() is an upper bound on the number of leaves
         // (it also counts internal nodes)
         std::vector<keyT> leaves;
         leaves.reserve(coeffs.size());

         const typename dcT::const_iterator last = coeffs.end();
         for (typename dcT::const_iterator entry=coeffs.begin(); entry!=last; ++entry) {
             if (!entry->second.is_leaf()) continue;
             leaves.push_back(entry->first);
         }
         return leaves;
     }


     /// Writes the quadrature points of the given boxes, in user coordinates, to a file.
     ///
     /// \param[in] filename name of the file to (over)write
     /// \param[in] keys     boxes whose grid points are written
     ///
     /// The file starts with the total number of points and a summary line; each
     /// box then contributes a "# key:" line followed by one line per point.
     /// Must be called on rank 0 only. Only NDIM==3 is supported: for any other
     /// dimension an exception is raised when the first box is processed. An
     /// exception is also raised if the file cannot be opened. The file is closed
     /// before either exception propagates.
     template <typename T, std::size_t NDIM>
     void  FunctionImpl<T,NDIM>::do_print_grid(const std::string filename, const std::vector<keyT>& keys) const {
         // invoke only on master node
         MADNESS_ASSERT(world.rank()==0);

         // the quadrature points in simulation coordinates of the root node
         const Tensor<double> qx=cdata.quad_x;
         const size_t npt = qx.dim(0);

         // the number of coordinates (grid point tuples) per box ({x1},{x2},{x3},..,{xNDIM})
         long npoints=power<NDIM>(npt);
         // the number of boxes
         long nboxes=keys.size();

         // prepare file; bail out instead of writing through a null handle
         FILE * pFile = fopen(filename.c_str(), "w");
         if (!pFile) {
             print("FunctionImpl: do_print_grid: could not open file",filename);
             MADNESS_EXCEPTION("FunctionImpl: do_print_grid: could not open output file",0);
         }

         fprintf(pFile,"%ld\n",npoints*nboxes);
         fprintf(pFile,"%ld points per box and %ld boxes \n",npoints,nboxes);

         // the simulation cell does not change from box to box
         const Tensor<double>& cell_width = FunctionDefaults<NDIM>::get_cell_width();
         const Tensor<double>& cell = FunctionDefaults<NDIM>::get_cell();

         // loop over all leaf boxes
         for (typename std::vector<keyT>::const_iterator key_it=keys.begin(); key_it!=keys.end(); ++key_it) {

             const keyT& key=*key_it;
             fprintf(pFile,"# key: %8d",key.level());
             for (size_t d=0; d<NDIM; d++) fprintf(pFile,"%8d",int(key.translation()[d]));
             fprintf(pFile,"\n");

             if (NDIM != 3) {
                 // do not leak the file handle when giving up
                 fclose(pFile);
                 MADNESS_EXCEPTION("only NDIM=3 in print_grid",0);
             }

             // this is borrowed from fcube
             const Vector<Translation,NDIM>& l = key.translation();
             const Level n = key.level();
             const double h = std::pow(0.5,double(n));
             coordT c; // will hold the point in user coordinates

             for (size_t ix=0; ix<npt; ++ix) {
                 c[0] = cell(0,0) + h*cell_width[0]*(l[0] + qx(ix)); // x
                 for (size_t iy=0; iy<npt; ++iy) {
                     c[1] = cell(1,0) + h*cell_width[1]*(l[1] + qx(iy)); // y
                     for (size_t iz=0; iz<npt; ++iz) {
                         c[2] = cell(2,0) + h*cell_width[2]*(l[2] + qx(iz)); // z
                         fprintf(pFile,"%18.12f %18.12f %18.12f\n",c[0],c[1],c[2]);
                     }
                 }
             }
         }
         fclose(pFile);
     }


     /// Returns the truncation tolerance to use for the box \c key.
     ///
     /// \param[in] tol base tolerance
     /// \param[in] key box whose level enters the level-dependent modes
     /// \return \c tol scaled by 2^(-NDIM/2) and, for truncate_mode 1 or 2, by a
     ///         further level-dependent factor that never exceeds 1
     ///
     /// Any other truncate_mode raises a MADNESS exception.
     template <typename T, std::size_t NDIM>
     double FunctionImpl<T,NDIM>::truncate_tol(double tol, const keyT& key) const {
         // Dimension-dependent prefactor, evaluated once
         static const double fac=1.0/std::pow(2,NDIM*0.5);
         const double scaled_tol = tol*fac;

         // RJH ... introduced max level here to avoid runaway
         // refinement due to truncation threshold going down to
         // intrinsic numerical error
         const int MAXLEVEL1 = 20; // 0.5**20 ~= 1e-6
         const int MAXLEVEL2 = 10; // 0.25**10 ~= 1e-6

         switch (truncate_mode) {
         case 0:
             return scaled_tol;
         case 1: {
             const double L = FunctionDefaults<NDIM>::get_cell_min_width();
             const int capped_level = std::min(key.level(),MAXLEVEL1);
             return scaled_tol*std::min(1.0,pow(0.5,double(capped_level))*L);
         }
         case 2: {
             const double L = FunctionDefaults<NDIM>::get_cell_min_width();
             const int capped_level = std::min(key.level(),MAXLEVEL2);
             return scaled_tol*std::min(1.0,pow(0.25,double(capped_level))*L*L);
         }
         default:
             MADNESS_EXCEPTION("truncate_mode invalid",truncate_mode);
         }
     }


     /// Returns, per dimension, the slice selected by the lowest bit of the child's translation.
     ///
     /// Entry \c d of the result is \c cdata.s[0] when the translation of \c child
     /// in dimension \c d is even and \c cdata.s[1] when it is odd.
     template <typename T, std::size_t NDIM>
     std::vector<Slice> FunctionImpl<T,NDIM>::child_patch(const keyT& child) const {
         const Vector<Translation,NDIM>& translation = child.translation();

         std::vector<Slice> patch;
         patch.reserve(NDIM);
         for (std::size_t d=0; d<NDIM; ++d) {
             patch.push_back(cdata.s[translation[d]&1]); // Lowest bit of translation
         }
         return patch;
     }


     /// Produces coefficients for \c child in the 2k layout from those of \c parent.
     ///
     /// \param[in] child  key the coefficients are wanted for
     /// \param[in] parent key that \c coeff belongs to; must equal \c child or lie above it
     /// \param[in] coeff  coefficients of \c parent
     /// \return \c coeff itself if child==parent and it already has leading
     ///         dimension 2k; otherwise a tensor of shape \c cdata.v2k whose
     ///         \c cdata.s0 block holds the (transferred) coefficients
     ///
     /// Raises a MADNESS exception for an unexpected leading dimension or if
     /// \c child is not at or below the level of \c parent.
     template <typename T, std::size_t NDIM>
     typename FunctionImpl<T,NDIM>::coeffT FunctionImpl<T,NDIM>::parent_to_child_NS(const keyT& child, const keyT& parent,
                                                                                    const coeffT& coeff) const {
         const implT* f=this;
         coeffT result;

         if (child==parent) {
             // The node exists in f: an internal node already carries the NS form,
             // a leaf node only has sum coeffs, so the difference coeffs stay zero
             const bool is_internal = (coeff.dim(0)==2*f->get_k());
             const bool is_leaf = !is_internal && (coeff.dim(0)==f->get_k());

             if (is_internal) {
                 result=coeff;
             } else if (is_leaf) {
                 tensorT padded(f->cdata.v2k);
                 padded(f->cdata.s0)=coeff.full_tensor_copy();
                 result=coeffT(padded,f->get_tensor_args());
             } else {
                 MADNESS_EXCEPTION("confused k in parent_to_child_NS",1);
             }
             return result;
         }

         if (!(child.level()>parent.level())) {
             MADNESS_EXCEPTION("confused keys in parent_to_child_NS",1);
         }

         // parent and coeff should refer to a leaf node with sum coeffs only
         // b/c tree should be compressed with leaves kept.
         MADNESS_ASSERT(coeff.dim(0)==f->get_k());
         const coeffT coeff1=f->parent_to_child(coeff,parent,child);
         tensorT padded(f->cdata.v2k);
         padded(f->cdata.s0)=coeff1.full_tensor_copy();
         result=coeffT(padded,f->get_tensor_args());
         return result;
     }


     /// Returns the key at level \c n built from the point \c pt.
     ///
     /// Each translation is \c pt[d]*2^n converted to \c Translation.
     template <typename T, std::size_t NDIM>
     Key<NDIM> FunctionImpl<T,NDIM>::simpt2key(const coordT& pt, Level n) const {
         const double boxes_per_dim = std::pow(2.0, double(n));

         Vector<Translation,NDIM> translation;
         for (std::size_t d=0; d<NDIM; ++d)
             translation[d] = Translation(boxes_per_dim*pt[d]);

         return Key<NDIM>(n,translation);
     }


     // Gathers, for every box at level n, the cdata.s0 block of its coefficients
     // into one dense tensor, sums that tensor over all processes and returns it.
     // Requires a compressed, nonstandard tree and NDIM<=3 (asserted below).
     //
     // N=2^n, M=N/q, q must be power of 2

     // q=0 return coeffs [N,k] for direct sum

     // q>0 return coeffs [k,q,M] for fft sum

     template <typename T, std::size_t NDIM>

     typename FunctionImpl<T,NDIM>::tensorT FunctionImpl<T,NDIM>::coeffs_for_jun(Level n, long q) {

         MADNESS_ASSERT(compressed && nonstandard && NDIM<=3);

         // r is the tensor that is written into, r0 the one that is reduced and returned
         tensorT r,r0;

         // N = 2^n
         long N=1<<n;

         long M = (q ? N/q: N);

         if (q==0) {

             // direct-sum layout; q is set to 1 for the index arithmetic below
             q = 1;

             long dim[2*NDIM];

             for (std::size_t d=0; d<NDIM; ++d) {

                 dim[d ] = N;

                 dim[d+NDIM] = cdata.k;

             }

             tensorT rr(2*NDIM,dim);

             // NOTE(review): r and r0 are both assigned from rr; presumably these are
             // shallow copies sharing storage so that writes through r show up in r0 -- confirm
             r0=r=rr;

             //NNkk->MqMqkk, since fuse is not allowed. Now needs to move back to 2*NDIM, since tensor max dim is 6

             //for (int d=NDIM-1; d>=0; --d) r.splitdim_inplace_base(d,M,q);

         } else {

             // fft-sum layout: the k dimensions come first, then the N dimensions
             long dim[2*NDIM];

             for (std::size_t d=0; d<NDIM; ++d) {

                 //dim[d+NDIM*2] = M;

                 dim[d+NDIM ] = N;

                 dim[d ] = cdata.k;

             }

             tensorT rr(2*NDIM,dim);

             r0=rr;

             /*vector<long> map(3*NDIM);

               for (int d=0; d<NDIM; ++d) {

               map[d]=d+2*NDIM;

               map[NDIM+d]=2*d+1;

               map[2*NDIM+d]=2*d;

               }

               r.mapdim_inplace_base(map);

               //print(rr);

               //for (int d=1; d<NDIM; ++d) rr.swapdim_inplace_base(2*NDIM+d,NDIM+d); //kkqqMM->kkqMqM

               //print(rr);

               //for (int d=0; d<NDIM; ++d) rr.swapdim_inplace_base(NDIM+2*d,NDIM+2*d-1); //kkqMqM->kkMqMq

               //print(rr);

               //for (int d=0; d<NDIM; ++d) rr.fusedim_inplace_base(NDIM+d); //->kkNN

               //seems that this fuse is not allowed :(


               //print(rr);

               */

             // NOTE(review): r is obtained from rr by cycling dimensions; presumably a view
             // onto the same storage as r0 -- confirm
             r=rr.cycledim(NDIM,0,-1); //->NNkk or MqMqkk

         }

         // Debug output. NOTE(review): reads six entries from dims() although the tensors
         // are created with 2*NDIM dimensions -- presumably dims() always exposes at
         // least six entries; confirm
         print("faking done M q r(fake) r0(real)",M,q,"\n", std::vector<long> (r.dims(),r.dims()+6),std::vector<long> (r0.dims(),r0.dims()+6));

         ProcessID me = world.rank();

         // Extents handed to the IndexIterator below (presumably N in every dimension -- confirm)
         Vector<long,NDIM> t(N);


         // powX[d] = X^(NDIM-1-d): strides of a row-major index with extent X per dimension
         Vector<long,NDIM> powq, powN, powM;

         long NDIM1 = NDIM-1;

         powM[NDIM1]=powq[NDIM1]=powN[NDIM1]=1;

         for (int d=NDIM1-1; d>=0; --d) {

             powM[d] = powM[d+1]*M;

             powq[d] = powq[d+1]*q;

             powN[d] = powN[d+1]*N;

         }

         // M^NDIM
         long powMNDIM = powM[0]*M;


         // Visit every translation at level n; only locally owned keys are processed
         for (IndexIterator it(t); it; ++it) {

             keyT key(n, Vector<Translation,NDIM>(*it));

             if (coeffs.owner(key) == me) {

                 // NOTE: this iterator shadows the IndexIterator 'it' of the enclosing loop
                 typename dcT::iterator it = coeffs.find(key).get();

                 coeffT qq;


                 if (it == coeffs.end()) {

                     // must get from above

                     typedef std::pair< keyT,coeffT > pairT;

                     Future<pairT> result;

                     sock_it_to_me(key, result.remote_ref(world));

                     // result.get() is used immediately, i.e. this waits for the reply
                     const keyT& parent = result.get().first;

                     //                        const tensorT& t = result.get().second.full_tensor_copy();

                     const coeffT& t = result.get().second;


                     qq = (parent_to_child(t, parent, key));

                 } else {

                     qq = copy(it->second.coeff());

                 }

                 std::vector<Slice> s(NDIM*2);

                 // ll accumulates a flattened position built from l/q and l - (l/q)*q of each translation
                 long ll = 0;

                 for (std::size_t d=0; d<NDIM; ++d) {

                     Translation l = key.translation()[d];

                     // NOTE(review): the quotient is computed in single precision; for large l
                     // this may differ from integer division -- confirm that the range is small enough
                     long dum = long(float(l)/q);

                     ll += (l - dum*q)*powMNDIM*powq[d] + dum*powM[d];

                     //ll += (l % q)*powM[NDIM]*pow((double)q,NDIM-d-1) + (l/q)*pow((double)M,NDIM-d-1);


                     //print("translation",l);

                     //s[d       ] = Slice(l,l,0);

                     //s[d+NDIM  ] = Slice(l%q,l%q,0);

                     //s[d+NDIM] = Slice(0,k-1,1);

                 }

                 //long dum = ll;

                 // Split ll back into one index per dimension using the powN strides
                 for (std::size_t d=0; d<NDIM; ++d) {

                     // NOTE(review): single-precision division again, see above
                     Translation l = Translation(float(ll) / powN[d]);

                     //Translation l = ll / pow((double)N,NDIM-d-1);

                     s[d ] = Slice(l,l,0);

                     s[d+NDIM] = Slice(0,k-1,1);

                     ll = ll - l*powN[d];

                     //ll = ll % long(pow((double)N,NDIM-d-1));

                 }

                 //print(s, dum, key.translation());

                 // Only the cdata.s0 block of the coefficients is stored
                 coeffT qqq=qq(cdata.s0);

                 r(s) = qqq.full_tensor_copy();


             }

         }


         world.gop.fence();

         // Global sum combines the contributions of all processes
         world.gop.sum(r0);

         //print(r,r0);


         return r0;

     }


     /// Removes all nodes below \c max_level and turns the nodes at \c max_level into leaves.
     ///
     /// \param[in] max_level deepest level that is kept
     /// \return None
     ///
     /// The tree is made redundant first and the redundant state is undone
     /// afterwards. Nodes at \c max_level get their has_children flag cleared.
     template <typename T, std::size_t NDIM>
     Void FunctionImpl<T,NDIM>::erase(const Level& max_level) {
         this->make_redundant(true);

         // Entries must not be erased while the container is being iterated:
         // remember the doomed keys and erase them once the loop is done.
         std::vector<keyT> doomed;

         typename dcT::iterator end = coeffs.end();
         for (typename dcT::iterator it= coeffs.begin(); it!=end; ++it) {
             const keyT& key=it->first;
             if (key.level()>max_level) doomed.push_back(key);
             else if (key.level()==max_level) it->second.set_has_children(false);
         }

         for (typename std::vector<keyT>::const_iterator kit=doomed.begin(); kit!=doomed.end(); ++kit) {
             coeffs.erase(*kit);
         }

         this->undo_redundant(true);
         return None;
     }


     /// Reduces do_check_symmetry_local over all locally stored nodes.
     ///
     /// \return the value produced by the task-queue reduction
     template <typename T, std::size_t NDIM>
     double FunctionImpl<T,NDIM>::check_symmetry_local() const {
         PROFILE_MEMBER_FUNC(FunctionImpl);
         typedef Range<typename dcT::const_iterator> rangeT;

         // The whole local container, reduced with the symmetry-checking operator
         const rangeT local_nodes(coeffs.begin(),coeffs.end());
         const do_check_symmetry_local symmetry_op(*this);
         return world.taskq.reduce<double,rangeT,do_check_symmetry_local>(local_nodes,symmetry_op);
     }


     /// Recursively refine a set of functions below `key` until, in every box
     /// visited, all of them hold coefficients.
     ///
     /// For each function v[i] a write accessor to its node at `key` is taken.
     /// If c[i] is non-empty it is stored as a new node at `key` (the node must
     /// not exist yet); otherwise the node must already exist. When some
     /// function lacks coefficients at `key`, those that do have them are
     /// unfiltered to the child level, lose their coefficients at `key`, and the
     /// recursion continues as one task per child on the child's owner.
     ///
     /// @param[in] v   the functions to refine; all must share this function's process map
     /// @param[in] c   per-function coefficients passed down from the parent box (may be empty tensors)
     /// @param[in] key the box being processed
     /// @return None
     template <typename T, std::size_t NDIM>

     Void FunctionImpl<T,NDIM>::refine_to_common_level(const std::vector<FunctionImpl<T,NDIM>*>& v,

                                                       const std::vector<tensorT>& c,

                                                       const keyT key) {

         // At the root only the owning process does any work
         if (key == cdata.key0 && coeffs.owner(key)!=world.rank()) return None;


         // First insert coefficients from above ... also get write accessors here

         ScopedArray<typename dcT::accessor> acc(new typename dcT::accessor[v.size()]);

         // NOTE(review): the accessor array has v.size() entries but this loop
         // runs to c.size(); the later loops index acc up to v.size().
         // Presumably c.size()==v.size() -- confirm against callers.
         for (unsigned int i=0; i<c.size(); i++) {

             MADNESS_ASSERT(v[i]->coeffs.get_pmap() == coeffs.get_pmap());

             MADNESS_ASSERT(v[i]->coeffs.owner(key) == world.rank());

             // insert() reports whether a new entry was created
             bool exists = ! v[i]->coeffs.insert(acc[i],key);

             if (c[i].size()) {

                 // coefficients arriving from the parent always go into a fresh leaf node
                 MADNESS_ASSERT(!exists);

                 acc[i]->second = nodeT(coeffT(c[i],targs),false);

             }

             else {

                 // nothing was passed down, so the node has to be there already
                 MADNESS_ASSERT(exists);

             }

         }


         // If everyone has coefficients we are done

         bool done = true;

         for (unsigned int i=0; i<v.size(); i++) {

             done &= acc[i]->second.has_coeff();

         }


         if (!done) {

             // Those functions with coefficients need to be refined down

             // d[i] stays empty for functions without coefficients in this box
             std::vector<tensorT> d(v.size());

             for (unsigned int i=0; i<v.size(); i++) {

                 if (acc[i]->second.has_coeff()) {

                     // place the coefficients in the cdata.s0 block of a v2k-sized tensor
                     tensorT s(cdata.v2k);

                     //                        s(cdata.s0) = acc[i]->second.coeff()(___);

                     s(cdata.s0) = acc[i]->second.coeff().full_tensor_copy();

                     acc[i]->second.clear_coeff();

                     d[i] = unfilter(s);

                     // the node at `key` becomes an interior node
                     acc[i]->second.set_has_children(true);

                 }

             }


             // Loop thru children and pass down

             for (KeyChildIterator<NDIM> kit(key); kit; ++kit) {

                 const keyT& child = kit.key();

                 std::vector<Slice> cp = child_patch(child);

                 // empty entries tell the child that nothing was passed down for that function
                 std::vector<tensorT> childc(v.size());

                 for (unsigned int i=0; i<v.size(); i++) {

                     if (d[i].size()) childc[i] = copy(d[i](cp));

                 }

                 woT::task(coeffs.owner(child), &implT::refine_to_common_level, v, childc, child);

             }

         }


         return None;

     }


     /// Record the node counts reported by process `from`.
     ///
     /// Stores nl in box_leaf[from] and ni in box_interior[from]; print_info
     /// sends this call to rank 0. Horrifically non-scalable.
     /// Throws the string literal "NO!" when the world has more than 1000 processes.
     /// @param[in] from rank that reports its counts
     /// @param[in] nl   number of leaf nodes on that rank
     /// @param[in] ni   number of interior nodes on that rank
     /// @return None
     template <typename T, std::size_t NDIM>
     Void FunctionImpl<T,NDIM>::put_in_box(ProcessID from, long nl, long ni) const {
         const bool too_many_ranks = (world.size() > 1000);
         if (too_many_ranks) {
             throw "NO!";
         }
         box_leaf[from] = nl;
         box_interior[from] = ni;
         return None;
     }


     /// Print the number of leaf and interior nodes held by each process.
     ///
     /// Every rank counts its local nodes and sends the two counts to rank 0
     /// (put_in_box); after a fence rank 0 prints one "load:" line per rank.
     /// The function calls world.gop.fence() three times and returns
     /// immediately when the world has 1000 or more processes.
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::print_info() const {
         if (world.size() >= 1000)
             return;

         // Reset BOTH per-rank counters before new numbers are collected.
         // (The previous "box_leaf[i] = box_interior[i] == 0" stored the result
         // of a comparison in box_leaf and never cleared box_interior.)
         for (int i=0; i<world.size(); ++i) {
             box_leaf[i] = 0;
             box_interior[i] = 0;
         }
         world.gop.fence();

         // Count the nodes stored on this process
         long nleaf=0, ninterior=0;
         typename dcT::const_iterator end = coeffs.end();
         for (typename dcT::const_iterator it=coeffs.begin(); it!=end; ++it) {
             const nodeT& node = it->second;
             if (node.is_leaf())
                 ++nleaf;
             else
                 ++ninterior;
         }

         // Report to rank 0 and wait until every report has arrived
         this->send(0, &implT::put_in_box, world.rank(), nleaf, ninterior);
         world.gop.fence();

         if (world.rank() == 0) {
             for (int i=0; i<world.size(); ++i) {
                 printf("load: %5d %8ld %8ld\n", i, box_leaf[i], box_interior[i]);
             }
         }
         world.gop.fence();
     }


     /// Refinement test that never requests refinement.
     ///
     /// Neither the key nor the coefficients are inspected.
     /// @return always false
     template <typename T, std::size_t NDIM>
     bool FunctionImpl<T,NDIM>::noautorefine(const keyT& key, const tensorT& t) const {
         const bool refine = false;
         return refine;
     }


     /// Refinement test used when squaring: compares 2*lo*hi + hi*hi with the
     /// truncation tolerance of the box.
     ///
     /// lo and hi are filled in by tnorm() from the full-rank copy of the node's
     /// coefficients (presumably the norms of the low- and high-order parts --
     /// TODO confirm against tnorm).
     /// @param[in] key the box the node belongs to
     /// @param[in] t   the node whose coefficients are examined
     /// @return true if the estimate exceeds truncate_tol(thresh, key)
     template <typename T, std::size_t NDIM>
     bool FunctionImpl<T,NDIM>::autorefine_square_test(const keyT& key, const nodeT& t) const {
         double lo;
         double hi;
         tnorm(t.coeff().full_tensor_copy(), &lo, &hi);

         const double estimate = 2*lo*hi + hi*hi;
         return estimate > truncate_tol(thresh, key);
     }


     /// Add the coefficients `s` received from the parent to the node at `key`
     /// and, for interior nodes, push the total down to the children.
     ///
     /// The node is inserted if it does not exist. Interior nodes that hold
     /// data unfilter it to the child level, clear their own coefficients and
     /// spawn one task per child on the child's owner (children receive an
     /// empty tensor when there is nothing to pass down). Leaf nodes without
     /// any coefficients get a zero tensor of size cdata.vk.
     /// @param[in] key the box being processed
     /// @param[in] s   coefficients passed down from the parent (may be empty)
     /// @return None
     template <typename T, std::size_t NDIM>
     Void FunctionImpl<T,NDIM>::sum_down_spawn(const keyT& key, const coeffT& s) {
         typename dcT::accessor acc;
         coeffs.insert(acc,key);
         nodeT& node = acc->second;
         coeffT& local = node.coeff();

         // accumulate the parent's contribution into this node
         if (s.size() > 0) {
             if (local.size() > 0) {
                 local.gaxpy(1.0,s,1.0);
             }
             else {
                 local = s;
             }
         }

         if (!node.has_children()) {
             // Missing coeffs assumed to be zero
             if (local.size() <= 0) local = coeffT(cdata.vk,targs);
             return None;
         }

         // interior node: move whatever is stored here down one level
         coeffT d;
         if (local.has_data()) {
             d = coeffT(cdata.v2k,targs);
             d(cdata.s0) += local;
             d = unfilter(d);
             node.clear_coeff();
         }
         for (KeyChildIterator<NDIM> kit(key); kit; ++kit) {
             const keyT& child = kit.key();
             coeffT ss;
             if (d.size() > 0) {
                 ss = copy(d(child_patch(child)));
             }
             woT::task(coeffs.owner(child), &implT::sum_down_spawn, child, ss);
         }
         return None;
     }


     /// Start the downward summation at the root of the tree.
     ///
     /// Only the process owning the root key calls sum_down_spawn, with empty
     /// coefficients.
     /// @param[in] fence if true, finish with a global fence
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::sum_down(bool fence) {
         const bool owns_root = (world.rank() == coeffs.owner(cdata.key0));
         if (owns_root) {
             sum_down_spawn(cdata.key0, coeffT());
         }

         if (fence) {
             world.gop.fence();
         }
     }


     /// Forward to DerivativeBase::forward_do_diff1, passing this object as
     /// the second argument.
     ///
     /// @param[in] D      the derivative operator that does the work
     /// @param[in] f      handed through to D unchanged
     /// @param[in] key    the box being processed
     /// @param[in] left   key/coefficient pair, handed through unchanged
     /// @param[in] center key/coefficient pair, handed through unchanged
     /// @param[in] right  key/coefficient pair, handed through unchanged
     /// @return whatever D->forward_do_diff1 returns
     template <typename T, std::size_t NDIM>

     Void FunctionImpl<T,NDIM>::forward_do_diff1(const DerivativeBase<T,NDIM>* D,

                                                 const implT* f,

                                                 const keyT& key,

                                                 const std::pair<keyT,coeffT>& left,

                                                 const std::pair<keyT,coeffT>& center,

                                                 const std::pair<keyT,coeffT>& right) {

         return D->forward_do_diff1(f,this,key,left,center,right);

     }


     /// Forward to DerivativeBase::do_diff1, passing this object as the second
     /// argument. diff() schedules this member as a task.
     ///
     /// @param[in] D      the derivative operator that does the work
     /// @param[in] f      handed through to D unchanged
     /// @param[in] key    the box being processed
     /// @param[in] left   key/coefficient pair, handed through unchanged
     /// @param[in] center key/coefficient pair, handed through unchanged
     /// @param[in] right  key/coefficient pair, handed through unchanged
     /// @return whatever D->do_diff1 returns
     template <typename T, std::size_t NDIM>

     Void FunctionImpl<T,NDIM>::do_diff1(const DerivativeBase<T,NDIM>* D,

                                         const implT* f,

                                         const keyT& key,

                                         const std::pair<keyT,coeffT>& left,

                                         const std::pair<keyT,coeffT>& center,

                                         const std::pair<keyT,coeffT>& right) {

         return D->do_diff1(f,this,key,left,center,right);

     }


     /// Called by the result function to differentiate f.
     ///
     /// Walks over the nodes of f stored on this process. For a node with
     /// coefficients the neighbours at step -1 and +1 are requested from D and
     /// a high-priority do_diff1 task is queued on this object; for a node
     /// without coefficients an empty node flagged as having children is
     /// placed into this function's tree at the same key.
     /// @param[in] D     the derivative operator
     /// @param[in] f     the function to differentiate
     /// @param[in] fence if true, finish with a global fence
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::diff(const DerivativeBase<T,NDIM>* D, const implT* f, bool fence) {
         typedef std::pair<keyT,coeffT> argT;

         typename dcT::const_iterator last = f->coeffs.end();
         for (typename dcT::const_iterator cur=f->coeffs.begin(); cur!=last; ++cur) {
             const keyT& key = cur->first;
             const nodeT& node = cur->second;

             if (!node.has_coeff()) {
                 coeffs.replace(key,nodeT(coeffT(),true)); // Empty internal node
                 continue;
             }

             Future<argT> left  = D->find_neighbor(f, key,-1);
             argT center(key,node.coeff());
             Future<argT> right = D->find_neighbor(f, key, 1);
             world.taskq.add(*this, &implT::do_diff1, D, f, key, left, center, right, TaskAttributes::hipri());
         }

         if (fence) {
             world.gop.fence();
         }
     }


     /// Return the key together with a ShallowNode built from the node stored
     /// under that key.
     ///
     /// The key must be present (asserted via coeffs.probe).
     /// @param[in] key the box to look up
     /// @return pair of (key, ShallowNode of the stored node)
     template <typename T, std::size_t NDIM>
     std::pair<Key<NDIM>,ShallowNode<T,NDIM> > FunctionImpl<T,NDIM>::find_datum(keyT key) const {
         typedef std::pair<Key<NDIM>,ShallowNode<T,NDIM> > datumT;

         MADNESS_ASSERT(coeffs.probe(key));
         ShallowNode<T,NDIM> snode(coeffs.find(key).get()->second);
         return datumT(key,snode);
     }


     /// Multiply a TT_2D tensor by a TT_FULL tensor acting on one particle.
     ///
     /// A copy of val_ket is made and, for every rank-one term of the copy,
     /// the vector belonging to `particle` is multiplied element-wise by
     /// val_pot. The slices obtained from ref_vector presumably alias the
     /// storage of the copy, so the product ends up in the returned tensor.
     /// @param[in] val_ket  the TT_2D operand (asserted)
     /// @param[in] val_pot  the TT_FULL operand (asserted)
     /// @param[in] particle 0 or 1 (asserted): which vector is multiplied
     /// @return the modified copy of val_ket
     template <typename T, std::size_t NDIM>
     typename FunctionImpl<T,NDIM>::coeffT FunctionImpl<T,NDIM>::multiply(const coeffT& val_ket, const coeffT& val_pot, int particle) const {
         MADNESS_ASSERT(val_pot.tensor_type()==TT_FULL);
         MADNESS_ASSERT(val_ket.tensor_type()==TT_2D);
         MADNESS_ASSERT(particle==0 or particle==1);

         coeffT product=copy(val_ket);

         // slice[0] selects one term, the remaining entries select everything
         std::vector<Slice> slice(product.config().dim_per_vector()+1,_);
         for (int term=0; term<product.rank(); ++term) {
             slice[0]=Slice(term,term);
             tensorT chunk=product.config().ref_vector(particle)(slice);
             chunk.emul(val_pot.full_tensor());
         }
         return product;
     }


     /// Combine the ket coefficients with up to two one-particle potentials and
     /// an additional full-rank factor `veri`.
     ///
     /// If none of the three factors has data, coeff_ket is returned
     /// unchanged. Otherwise the ket is converted to values, the potential
     /// terms are accumulated with multiply(), and the result is converted back
     /// to coefficients: through a full-rank tensor when veri has data,
     /// otherwise directly, followed by a rank reduction.
     /// @param[in] key         the box the coefficients belong to
     /// @param[in] coeff_ket   coefficients of the ket
     /// @param[in] vpotential1 factor applied with particle index 0 (may be empty)
     /// @param[in] vpotential2 factor applied with particle index 1 (may be empty)
     /// @param[in] veri        full-rank factor multiplied element-wise (may be empty)
     /// @return the assembled coefficients
     template <typename T, std::size_t NDIM>
     typename FunctionImpl<T,NDIM>::coeffT FunctionImpl<T,NDIM>::assemble_coefficients(const keyT& key, const coeffT& coeff_ket,
                                                                                       const coeffT& vpotential1, const coeffT& vpotential2,
                                                                                       const tensorT& veri) const {
         // take a shortcut if there is nothing to multiply with
         if (!vpotential1.has_data() && !vpotential2.has_data() && !veri.has_data()) {
             return coeff_ket;
         }

         // switch to values instead of coefficients
         coeffT val_ket=coeffs2values(key,coeff_ket);

         // accumulate the contributions of the one-particle potentials
         coeffT val_result;
         if (vpotential1.has_data()) val_result+=multiply(val_ket,vpotential1,0);
         if (vpotential2.has_data()) val_result+=multiply(val_ket,vpotential2,1);

         coeffT coeff_result;
         if (!veri.has_data()) {
             MADNESS_ASSERT(val_result.has_data());
             coeff_result=values2coeffs(key,val_result);
             coeff_result.reduce_rank(this->get_tensor_args().thresh);
             return coeff_result;
         }

         // values for eri: this must be done in full rank...
         tensorT val_ket2=val_ket.full_tensor_copy().emul(veri);
         if (val_result.has_data()) {
             val_ket2+=val_result.full_tensor_copy();
         }
         // values2coeffs expensive (30%), coeffT() (relatively) cheap (8%)
         coeff_result=coeffT(values2coeffs(key,val_ket2),this->get_tensor_args());
         return coeff_result;
     }


     /// Apply do_mapdim(map, *this) to every node of f.
     ///
     /// The constness of f is cast away to call flo_unary_op_node_inplace on it.
     /// @param[in] f     the function whose nodes are visited
     /// @param[in] map   the dimension map handed to do_mapdim
     /// @param[in] fence passed on to flo_unary_op_node_inplace
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::mapdim(const implT& f, const std::vector<long>& map, bool fence) {
         PROFILE_MEMBER_FUNC(FunctionImpl);

         implT* source = const_cast<implT*>(&f);
         source->flo_unary_op_node_inplace(do_mapdim(map,*this),fence);
     }


     /// Average this function with rhs.
     ///
     /// Three fenced steps: do_average(*this) is run over the nodes of rhs,
     /// this function is scaled by 0.5, and the ranks are reduced with the
     /// member tensor arguments.
     /// @param[in] rhs the other function
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::average(const implT& rhs) {
         // step 1: visit the nodes of rhs with an operation bound to this function
         rhs.flo_unary_op_node_inplace(do_average(*this),true);

         // step 2: halve
         this->scale_inplace(0.5,true);

         // step 3: compress the representation again
         this->flo_unary_op_node_inplace(do_reduce_rank(targs),true);
     }


     /// Apply do_change_tensor_type to every node of this function.
     ///
     /// @param[in] targs tensor arguments handed to the operation; note that the
     ///                  parameter hides the member of the same name
     /// @param[in] fence passed on to flo_unary_op_node_inplace
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::change_tensor_type1(const TensorArgs& targs, bool fence) {
         this->flo_unary_op_node_inplace(do_change_tensor_type(targs), fence);
     }


     /// Apply do_reduce_rank to every node of this function.
     ///
     /// @param[in] targs tensor arguments handed to the operation; note that the
     ///                  parameter hides the member of the same name
     /// @param[in] fence passed on to flo_unary_op_node_inplace
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::reduce_rank(const TensorArgs& targs, bool fence) {
         this->flo_unary_op_node_inplace(do_reduce_rank(targs), fence);
     }


     //  \endcode

     /// Transform a full tensor with cdata.hgT using fast_transform.
     ///
     /// Two scratch tensors of size cdata.v2k are handed to fast_transform (the
     /// `false` constructor argument presumably skips their initialisation).
     /// Equivalent in intent to transform(s, cdata.hgT).
     /// @param[in] s the tensor to transform
     /// @return the value returned by fast_transform
     template <typename T, std::size_t NDIM>
     typename FunctionImpl<T,NDIM>::tensorT FunctionImpl<T,NDIM>::filter(const tensorT& s) const {
         tensorT result(cdata.v2k,false);
         tensorT workspace(cdata.v2k,false);
         return fast_transform(s,cdata.hgT,result,workspace);
     }


     /// Transform coefficients (coeffT) with cdata.hgT.
     ///
     /// @param[in] s the coefficients to transform
     /// @return transform(s, cdata.hgT)
     template <typename T, std::size_t NDIM>
     typename FunctionImpl<T,NDIM>::coeffT FunctionImpl<T,NDIM>::filter(const coeffT& s) const {
         return transform(s,cdata.hgT);
     }


     /// Transform a full tensor with cdata.hg using fast_transform.
     ///
     /// Two scratch tensors of size cdata.v2k are handed to fast_transform (the
     /// `false` constructor argument presumably skips their initialisation).
     /// Equivalent in intent to transform(s, cdata.hg).
     /// @param[in] s the tensor to transform
     /// @return the value returned by fast_transform
     template <typename T, std::size_t NDIM>
     typename FunctionImpl<T,NDIM>::tensorT FunctionImpl<T,NDIM>::unfilter(const tensorT& s) const {
         tensorT result(cdata.v2k,false);
         tensorT workspace(cdata.v2k,false);
         return fast_transform(s,cdata.hg,result,workspace);
     }


     /// Transform coefficients (coeffT) with cdata.hg.
     ///
     /// @param[in] s the coefficients to transform
     /// @return transform(s, cdata.hg)
     template <typename T, std::size_t NDIM>
     typename FunctionImpl<T,NDIM>::coeffT FunctionImpl<T,NDIM>::unfilter(const coeffT& s) const {
         coeffT result=transform(s,cdata.hg);
         return result;
     }


     /// Accumulate the coefficients of all children of `key` into one tensor
     /// of size cdata.vk.
     ///
     /// Each child's coefficients are transformed with one matrix per
     /// dimension, cdata.h0T or cdata.h1T depending on whether the child's
     /// translation in that dimension is even or odd, and the full-rank result
     /// is added to the sum (see Alpert Eq (3.34a)).
     /// @param[in] key the parent box
     /// @param[in] v   futures of the children's coefficients, in KeyChildIterator order
     /// @return the accumulated tensor
     template <typename T, std::size_t NDIM>
     typename FunctionImpl<T,NDIM>::tensorT FunctionImpl<T,NDIM>::downsample(const keyT& key, const std::vector< Future<coeffT > >& v) const {
         tensorT result(cdata.vk);

         // index 0: even translation, index 1: odd translation
         const tensorT h[2] = {cdata.h0T, cdata.h1T};
         tensorT matrices[NDIM];

         long child_index=0;
         for (KeyChildIterator<NDIM> kit(key); kit; ++kit,++child_index) {
             // pick the matrix for each dimension of this child
             for (size_t dim=0; dim<NDIM; ++dim) {
                 matrices[dim]=h[kit.key().translation()[dim]%2];
             }

             // transform and accumulate on the result
             result+=general_transform(v[child_index].get(),matrices).full_tensor_copy();
         }
         return result;
     }


     /// Transform coefficients for the child box `key` using one matrix per
     /// dimension.
     ///
     /// cdata.h0 is used where the translation of `key` is even in a
     /// dimension, cdata.h1 where it is odd (see Alpert Eq (3.35a/b)). No
     /// difference coefficients are involved; use unfilter for that.
     /// @param[in] key   the child box whose translation selects the matrices
     /// @param[in] coeff the coefficients to transform
     /// @return general_transform(coeff, matrices)
     template <typename T, std::size_t NDIM>
     typename FunctionImpl<T,NDIM>::coeffT FunctionImpl<T,NDIM>::upsample(const keyT& key, const coeffT& coeff) const {
         // index 0: even translation, index 1: odd translation
         const tensorT h[2] = {cdata.h0, cdata.h1};
         tensorT matrices[NDIM];

         for (size_t dim=0; dim<NDIM; ++dim) {
             matrices[dim]=h[key.translation()[dim]%2];
         }

         return general_transform(coeff,matrices);
     }


     /// Copy the tree of `old` into this function, adapting the coefficient
     /// block size.
     ///
     /// For every local node of old that has coefficients, a zero tensor of
     /// size cdata.vk is created and the leading min(k, old k) entries in each
     /// dimension are taken over; nodes without coefficients become empty nodes
     /// flagged as having children.
     /// @param[in] old   the function to copy from
     /// @param[in] fence if true, finish with a global fence
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::project(const implT& old, bool fence) {
         long kmin = std::min(cdata.k,old.cdata.k);
         // the part of the coefficient block common to both functions
         std::vector<Slice> common(NDIM,Slice(0,kmin-1));

         typename dcT::const_iterator last = old.coeffs.end();
         for (typename dcT::const_iterator cur=old.coeffs.begin(); cur!=last; ++cur) {
             const keyT& key = cur->first;
             const nodeT& node = cur->second;

             if (!node.has_coeff()) {
                 coeffs.replace(key,nodeT(coeffT(),true));
                 continue;
             }

             coeffT c(cdata.vk,targs);
             c(common) += node.coeff()(common);
             coeffs.replace(key,nodeT(c,false));
         }

         if (fence) {
             world.gop.fence();
         }
     }


     /// Check whether a node is stored under `key` and has children.
     ///
     /// @param[in] key the box to look up
     /// @return true only if coeffs.probe(key) succeeds and the node has children
     template <typename T, std::size_t NDIM>
     bool FunctionImpl<T,NDIM>::exists_and_has_children(const keyT& key) const {
         if (!coeffs.probe(key)) {
             return false;
         }
         return coeffs.find(key).get()->second.has_children();
     }


     /// Check whether a node is stored under `key` and has no children.
     ///
     /// @param[in] key the box to look up
     /// @return true only if coeffs.probe(key) succeeds and the node has no children
     template <typename T, std::size_t NDIM>
     bool FunctionImpl<T,NDIM>::exists_and_is_leaf(const keyT& key) const {
         if (!coeffs.probe(key)) {
             return false;
         }
         return (not coeffs.find(key).get()->second.has_children());
     }


     /// Refine the node at `key` if any of the supplied flags is true.
     ///
     /// broaden() passes in one flag per neighbour; the flags are read in
     /// order and reading stops at the first true one. refine_op is called at
     /// most once, with true_refine_test().
     /// @param[in] key the box that may be refined
     /// @param[in] v   the flags
     /// @return None
     template <typename T, std::size_t NDIM>
     Void FunctionImpl<T,NDIM>::broaden_op(const keyT& key, const std::vector< Future <bool> >& v) {
         bool must_refine = false;
         for (unsigned int i=0; i<v.size(); ++i) {
             if (v[i]) {
                 must_refine = true;
                 break;
             }
         }

         if (must_refine) {
             refine_op(true_refine_test(), key);
         }
         return None;
     }


     /// Set the norm-tree value of every node stored on this process to 0.0.
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::zero_norm_tree() {
         typename dcT::iterator last = coeffs.end();
         typename dcT::iterator cur = coeffs.begin();
         while (cur != last) {
             cur->second.set_norm_tree(0.0);
             ++cur;
         }
     }


     /// Broaden the tree.
     ///
     /// For every local node that has coefficients, whose norm-tree value is not
     /// -1.0 and whose coefficient norm is at least truncate_tol(thresh,key), the
     /// node is marked with norm-tree value -1.0 and 3^NDIM neighbouring keys are
     /// asked (on their owners) whether they exist and have children. The
     /// answers are handed to a broaden_op task on this process, which refines
     /// the node if any answer is true.
     ///
     /// @param[in] is_periodic passed on to neighbor() for each displacement
     /// @param[in] fence       if true: fence, reset all norm-tree values to 0.0
     ///                        via zero_norm_tree(), and fence again
     template <typename T, std::size_t NDIM>

     void FunctionImpl<T,NDIM>::broaden(std::vector<bool> is_periodic, bool fence) {

         typename dcT::iterator end = coeffs.end();

         for (typename dcT::iterator it=coeffs.begin(); it!=end; ++it) {

             const keyT& key = it->first;

             // take a write accessor for the node; it is released at the end of each iteration
             typename dcT::accessor acc;

             MADNESS_ASSERT(coeffs.find(acc,key));

             nodeT& node = acc->second;

             if (node.has_coeff() &&

                 node.get_norm_tree() != -1.0 &&

                 node.coeff().normf() >= truncate_tol(thresh,key)) {


                 node.set_norm_tree(-1.0); // Indicates already broadened or result of broadening/refining


                 //int ndir = std::pow(3,NDIM);

                 // number of displacement combinations: three choices per dimension
                 int ndir = static_cast<int>(std::pow(static_cast<double>(3), static_cast<int>(NDIM)));

                 std::vector< Future <bool> > v = future_vector_factory<bool>(ndir);

                 // NOTE(review): this variable is never used; the loop below declares its own `neigh`
                 keyT neigh;

                 int i=0;

                 for (HighDimIndexIterator it(NDIM,3); it; ++it) {

                     Vector<Translation,NDIM> l(*it);

                     for (std::size_t d=0; d<NDIM; ++d) {

                         const int odd = key.translation()[d] & 0x1L; // 1 if odd, 0 if even

                         l[d] -= 1; // (0,1,2) --> (-1,0,1)

                         // stretch the step by the parity of the translation:
                         // -1 becomes -1 (even) or -2 (odd), +1 becomes +2 (even) or +1 (odd)
                         if (l[d] == -1)

                             l[d] = -1-odd;

                         else if (l[d] ==  1)

                             l[d] = 2 - odd;

                     }

                     keyT neigh = neighbor(key, keyT(key.level(),l), is_periodic);


                     if (neigh.is_valid()) {

                         // ask the owner of the neighbour; the answer arrives as a future
                         v[i++] = this->send(coeffs.owner(neigh), &implT::exists_and_has_children, neigh);

                     }

                     else {

                         // an invalid neighbour counts as "no"
                         v[i++].set(false);

                     }

                 }

                 woT::task(world.rank(), &implT::broaden_op, key, v);

             }

         }

         // Reset value of norm tree so that can repeat broadening

         if (fence) {

             world.gop.fence();

             zero_norm_tree();

             world.gop.fence();

         }

     }


     /// Start trickle_down_op at the root of the tree.
     ///
     /// The nonstandard, compressed and redundant flags are cleared first.
     /// Only the process owning the root key submits the task, with empty
     /// coefficients.
     /// @param[in] fence if true, finish with a global fence
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::trickle_down(bool fence) {
         redundant = false;
         compressed = false;
         nonstandard = false;

         const bool owns_root = (world.rank() == coeffs.owner(cdata.key0));
         if (owns_root) {
             woT::task(world.rank(), &implT::trickle_down_op, cdata.key0,coeffT());
         }
         if (fence) {
             world.gop.fence();
         }
     }


     /// Sum the coefficients `s` coming from the parent into the node at `key`
     /// and hand the total down to the children.
     ///
     /// Note that after application of an integral operator not all siblings
     /// may be present, so a missing node is inserted as an empty leaf. If
     /// summing the result of an integral operator (i.e., from non-standard
     /// form) there will be significant scaling function coefficients at all
     /// levels and possibly difference coefficients in leaves, hence the tree
     /// may refine as a result.
     /// @param[in] key the box being processed
     /// @param[in] s   coefficients passed down from the parent
     /// @return None
     template <typename T, std::size_t NDIM>
     Void FunctionImpl<T,NDIM>::trickle_down_op(const keyT& key, const coeffT& s) {
         typename dcT::iterator it = coeffs.find(key).get();
         if (it == coeffs.end()) {
             // absent sibling: create an empty leaf and look it up again
             coeffs.replace(key,nodeT(coeffT(),false));
             it = coeffs.find(key).get();
         }
         nodeT& node = it->second;

         // The integral operator will correctly connect interior nodes
         // to children but may leave interior nodes without coefficients
         // ... but they still need to sum down so just give them zeros
         if (node.coeff().has_no_data()) {
             node.coeff()=coeffT(cdata.vk,targs);
         }

         if (!node.has_children()) {
             // leaf: keep the sum here
             node.coeff()+=s;
             node.coeff().reduce_rank(thresh);
             return None;
         }

         // interior node (must allow for inconsistent state from transform, etc.)
         coeffT d = node.coeff();
         if (key.level() > 0) d += s; // -- note accumulate for NS summation
         node.clear_coeff();
         for (KeyChildIterator<NDIM> kit(key); kit; ++kit) {
             const keyT& child = kit.key();
             coeffT ss= upsample(child,d);
             ss.reduce_rank(thresh);
             PROFILE_BLOCK(recon_send);
             woT::task(coeffs.owner(child), &implT::trickle_down_op, child, ss);
         }
         return None;
     }


     /// Start reconstruct_op at the root of the tree.
     ///
     /// The function must not be in redundant form (asserted). The state flags
     /// are cleared before any task is submitted so that successive calls
     /// without fence do the right thing. Only the process owning the root key
     /// submits the task, with empty coefficients.
     /// @param[in] fence if true, finish with a global fence
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::reconstruct(bool fence) {
         MADNESS_ASSERT(not is_redundant());

         redundant = false;
         compressed = false;
         nonstandard = false;

         const bool owns_root = (world.rank() == coeffs.owner(cdata.key0));
         if (owns_root) {
             woT::task(world.rank(), &implT::reconstruct_op, cdata.key0,coeffT());
         }
         if (fence) {
             world.gop.fence();
         }
     }


     /// Start compress_spawn at the root of the tree.
     ///
     /// The function must not be in redundant form on entry (asserted). The
     /// state flags are set before any work is spawned so that successive calls
     /// without fence do the right thing.
     /// @param[in] nonstandard stored in the nonstandard flag and passed to compress_spawn
     /// @param[in] keepleaves  passed to compress_spawn; must be true when redundant is requested
     /// @param[in] redundant   stored in the redundant flag; exclusive with nonstandard
     /// @param[in] fence       if true, finish with a global fence
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::compress(bool nonstandard, bool keepleaves, bool redundant, bool fence) {
         MADNESS_ASSERT(not is_redundant());

         // the parameters hide the members of the same name, hence this->
         this->compressed = true;
         this->nonstandard = nonstandard;
         this->redundant = redundant;

         // these two are exclusive
         MADNESS_ASSERT(not (redundant and nonstandard));
         // otherwise we lose information
         if (redundant) {MADNESS_ASSERT(keepleaves);}

         const bool owns_root = (world.rank() == coeffs.owner(cdata.key0));
         if (owns_root) {
             compress_spawn(cdata.key0, nonstandard, keepleaves, redundant);
         }
         if (fence) {
             world.gop.fence();
         }
     }


     /// Bring the function into redundant form.
     ///
     /// Returns at once if it is already redundant. A nonstandard function is
     /// first converted with standard(true), a compressed one is reconstructed
     /// with a fence, and then compress(false,true,true,fence) is called. The
     /// compressed flag is cleared afterwards.
     /// @param[in] fence passed on to the final compress call
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::make_redundant(const bool fence) {
         // fast return if possible
         if (is_redundant()) {
             return;
         }

         // NS form might have leaf sum coeffs, but we don't know:
         // change to standard compressed form
         if (is_nonstandard()) {
             this->standard(true);
         }

         // we need the leaf sum coeffs, so reconstruct
         if (is_compressed()) {
             reconstruct(true);
         }

         compress(false,true,true,fence);
         compressed=false;
     }


     /// Leave redundant form: clear the state flags and run
     /// remove_internal_coeffs over all nodes.
     ///
     /// Does nothing if the function is not redundant.
     /// @param[in] fence passed on to flo_unary_op_node_inplace
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::undo_redundant(const bool fence) {
         if (!is_redundant()) {
             return;
         }

         nonstandard = false;
         compressed = false;
         redundant = false;
         this->flo_unary_op_node_inplace(remove_internal_coeffs(),fence);
     }


     /// Start norm_tree_spawn at the root of the tree.
     ///
     /// Only the process owning the root key makes the call.
     /// @param[in] fence if true, finish with a global fence
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::norm_tree(bool fence) {
         const bool owns_root = (world.rank() == coeffs.owner(cdata.key0));
         if (owns_root) {
             norm_tree_spawn(cdata.key0);
         }
         if (fence) {
             world.gop.fence();
         }
     }


     /// Combine the children's norm-tree values into the value for `key`.
     ///
     /// The result is the square root of the sum of squares of the values in
     /// v, one per child of `key`. It is stored in the node through a
     /// container task calling nodeT::set_norm_tree and also returned.
     /// @param[in] key the parent box
     /// @param[in] v   futures of the children's values, in KeyChildIterator order
     /// @return the combined value
     template <typename T, std::size_t NDIM>
     double FunctionImpl<T,NDIM>::norm_tree_op(const keyT& key, const std::vector< Future<double> >& v) {
         PROFILE_MEMBER_FUNC(FunctionImpl);

         double sumsq = 0.0;
         int slot=0;
         for (KeyChildIterator<NDIM> kit(key); kit; ++kit,++slot) {
             double child_norm = v[slot].get();
             sumsq += child_norm*child_norm;
         }

         double norm = sqrt(sumsq);
         coeffs.task(key, &nodeT::set_norm_tree, norm); // why a task?
         return norm;
     }


     /// Compute the norm-tree value for `key`, recursing into the children.
     ///
     /// A node without children stores the norm of its coefficients as its
     /// norm-tree value and returns it. Otherwise one norm_tree_spawn task per
     /// child is submitted to the child's owner and a norm_tree_op task on this
     /// process combines the results.
     /// @param[in] key the box being processed
     /// @return future of the norm-tree value of this box
     template <typename T, std::size_t NDIM>
     Future<double> FunctionImpl<T,NDIM>::norm_tree_spawn(const keyT& key) {
         nodeT& node = coeffs.find(key).get()->second;

         if (!node.has_children()) {
             const double norm=node.coeff().normf();
             // invoked locally anyways
             node.set_norm_tree(norm);
             return Future<double>(norm);
         }

         std::vector< Future<double> > v = future_vector_factory<double>(1<<NDIM);
         int slot=0;
         for (KeyChildIterator<NDIM> kit(key); kit; ++kit,++slot) {
             v[slot] = woT::task(coeffs.owner(kit.key()), &implT::norm_tree_spawn, kit.key());
         }
         return woT::task(world.rank(),&implT::norm_tree_op, key, v);
     }


     /// Recursive driver for truncating a reconstructed tree.
     ///
     /// The key must be present (asserted). A node without children returns
     /// its coefficients right away. For a node with children one
     /// high-priority task per child is submitted to the child's owner, and a
     /// high-priority truncate_reconstructed_op task on this process uses the
     /// results to decide whether the children can be removed.
     /// @param[in] key the box being processed
     /// @param[in] tol tolerance handed down unchanged
     /// @return future of the (possibly empty) sum coefficients of this box
     template <typename T, std::size_t NDIM>
     Future<typename FunctionImpl<T,NDIM>::coeffT> FunctionImpl<T,NDIM>::truncate_reconstructed_spawn(const keyT& key, const double tol) {
         MADNESS_ASSERT(coeffs.probe(key));
         nodeT& node = coeffs.find(key).get()->second;

         // leaf: just hand back the sum coefficients
         if (not node.has_children()) {
             return Future<coeffT>(node.coeff());
         }

         // interior node: collect the sum coefficients of all children
         std::vector<Future<coeffT> > v = future_vector_factory<coeffT>(1<<NDIM);
         int slot=0;
         for (KeyChildIterator<NDIM> kit(key); kit; ++kit,++slot) {
             v[slot] = woT::task(coeffs.owner(kit.key()), &implT::truncate_reconstructed_spawn, kit.key(),tol,TaskAttributes::hipri());
         }

         // will return (possibly empty) sum coefficients
         return woT::task(world.rank(),&implT::truncate_reconstructed_op,key,v,tol,TaskAttributes::hipri());
     }


     /// Decide whether the children of `key` can be removed and, if so, replace
     /// them by sum coefficients stored at `key`.
     ///
     /// If any child delivered empty coefficients, nothing is changed and empty
     /// coefficients are returned. Otherwise the children's coefficients are
     /// assembled into one tensor of size cdata.v2k and filtered; the cdata.s0
     /// block is taken as the sum coefficients and the norm of the remainder is
     /// the error. If the error is below truncate_tol(tol,key) the node becomes
     /// a leaf, its children are erased and the sum coefficients are stored.
     ///
     /// @param[in] key the parent box (must be present, asserted)
     /// @param[in] v   futures of the children's sum coefficients, in KeyChildIterator order
     /// @param[in] tol tolerance passed to truncate_tol
     /// @return the new sum coefficients if the children were removed, empty coefficients otherwise
     template <typename T, std::size_t NDIM>

     typename FunctionImpl<T,NDIM>::coeffT FunctionImpl<T,NDIM>::truncate_reconstructed_op(const keyT& key, const std::vector< Future<coeffT > >& v, const double tol) {


         MADNESS_ASSERT(coeffs.probe(key));


         // the sum coefficients might be empty, which means they come from an internal node

         // and we must not truncate; so just return empty coeffs again

         for (size_t i=0; i<v.size(); ++i) if (v[i].get().has_no_data()) return coeffT();


         // write accessor for the node at key; used below to store the new coefficients
         typename dcT::accessor acc;

         MADNESS_ASSERT(coeffs.find(acc, key));


         //

         // !! THE DISABLED BRANCH BELOW IS NOT NUMERICALLY STABLE !!

         //

 #if 0

         // the sum coefficients on this level, and their norm

         const tensorT s=downsample(key,v);

         const double snorm=s.normf();


         // get the norm of all child coefficients

         double dnorm=0.0;

         for (size_t i=0; i<v.size(); ++i) {

             const double d=v[i].get().normf();

             dnorm+=d*d;

         }


         // the error; equivalent to the norm of the wavelet coefficients

         const double error=sqrt(dnorm-snorm*snorm);

 #else

         // active branch: assemble the children, filter, and measure what lies outside the s0 block
         int i=0;

         tensorT d(cdata.v2k);

         for (KeyChildIterator<NDIM> kit(key); kit; ++kit,++i) {

             //                d(child_patch(kit.key())) += v[i].get();

             d(child_patch(kit.key())) += v[i].get().full_tensor_copy();

         }


         d = filter(d);

         // keep a copy of the s0 block, then zero it so that only the remainder enters the norm
         tensorT s=copy(d(cdata.s0));

         d(cdata.s0) = 0.0;

         const double error=d.normf();


 #endif

         nodeT& node = coeffs.find(key).get()->second;


         if (error < truncate_tol(tol,key)) {

             // the node becomes a leaf and its children are removed
             node.set_has_children(false);

             for (KeyChildIterator<NDIM> kit(key); kit; ++kit) {

                 coeffs.erase(kit.key());

             }

             // "replace" children with new sum coefficients

             coeffT ss=coeffT(s,targs);

             acc->second.set_coeff(ss);

             return ss;

         } else {

             // keep the children; empty coefficients tell the caller not to truncate further up
             return coeffT();

         }

     }


     /// Build the coefficients of the node at `key` from the scaling
     /// coefficients of its children.
     ///
     /// The children's coefficients are copied into one tensor of size cdata.v2k
     /// and filtered. Coefficients already stored in the node are added. The
     /// cdata.s0 block is returned as the sum coefficients; in the tensor stored
     /// in the node that block is zeroed unless key is at level 0 or nonstandard
     /// is requested. Both results are built with a threshold ten times tighter
     /// than the member tensor arguments. CPU time is accumulated in
     /// timer_filter and timer_compress_svd.
     ///
     /// @param[in] key         the parent box (must be present, asserted)
     /// @param[in] v           futures of the children's coefficients, in KeyChildIterator order
     /// @param[in] nonstandard if true, the s0 block is kept in the stored tensor
     /// @param[in] redundant   must be false (asserted)
     /// @return the sum coefficients of this box
     template <typename T, std::size_t NDIM>

     typename FunctionImpl<T,NDIM>::coeffT FunctionImpl<T,NDIM>::compress_op(const keyT& key, const std::vector< Future<coeffT > >& v, bool nonstandard, bool redundant) {

         PROFILE_MEMBER_FUNC(FunctionImpl);


         // NOTE(review): with this assertion the `if (redundant)` branch further down cannot be taken
         MADNESS_ASSERT(not redundant);

         double cpu0=cpu_time();

         // Copy child scaling coeffs into contiguous block

         tensorT d(cdata.v2k);

         //            coeffT d(cdata.v2k,targs);

         int i=0;

         for (KeyChildIterator<NDIM> kit(key); kit; ++kit,++i) {

             //                d(child_patch(kit.key())) += v[i].get();

             d(child_patch(kit.key())) += v[i].get().full_tensor_copy();

         }


         d = filter(d);

         // time spent assembling and filtering
         double cpu1=cpu_time();

         timer_filter.accumulate(cpu1-cpu0);

         cpu0=cpu1;


         typename dcT::accessor acc;

         MADNESS_ASSERT(coeffs.find(acc, key));


         // the node may already hold coefficients; add them to the filtered block
         if (acc->second.has_coeff()) {

             print(" stuff in compress_op");

             //                const coeffT& c = acc->second.coeff();

             const tensorT c = acc->second.coeff().full_tensor_copy();

             // first dimension equal to k: add to the s0 block only; otherwise add to the whole tensor
             if (c.dim(0) == k) {

                 d(cdata.s0) += c;

             }

             else {

                 d += c;

             }

         }


         // tighter thresh for internal nodes

         TensorArgs targs2=targs;

         targs2.thresh*=0.1;


         // need the deep copy for contiguity

         coeffT ss=coeffT(copy(d(cdata.s0)),targs2);


         // below the root, and unless nonstandard is requested, the s0 block is removed from d
         if (key.level()> 0 && !nonstandard)

             d(cdata.s0) = 0.0;


         // insert either sum or difference coefficients

         if (redundant) {

             acc->second.set_coeff(ss);

         } else {

             coeffT dd=coeffT(d,targs2);

             acc->second.set_coeff(dd);

         }

         // time spent converting and storing the coefficients
         cpu1=cpu_time();

         timer_compress_svd.accumulate(cpu1-cpu0);


         // return sum coefficients

         return ss;

     }


     /// Compute the sum coefficients of `key` from those of its children and
     /// store them in the node.
     ///
     /// The coefficients come from downsample() and are built with a threshold
     /// ten times tighter than the member tensor arguments. The node must exist
     /// and must not hold coefficients yet (both asserted).
     /// @param[in] key the parent box
     /// @param[in] v   futures of the children's sum coefficients
     /// @return the sum coefficients stored in the node
     template <typename T, std::size_t NDIM>
     typename FunctionImpl<T,NDIM>::coeffT FunctionImpl<T,NDIM>::make_redundant_op(const keyT& key, const std::vector< Future<coeffT > >& v) {
         // tighter threshold for the sum coefficients of this level
         TensorArgs tight=targs;
         tight.thresh*=0.1;
         coeffT sum_coeffs(this->downsample(key,v),tight);

         // insert sum coefficients into tree
         typename dcT::accessor acc;
         MADNESS_ASSERT(coeffs.find(acc, key));
         MADNESS_ASSERT(not (acc->second.has_coeff()));
         acc->second.set_coeff(sum_coeffs);

         return sum_coeffs;
     }


     /// Run do_standard over all nodes and clear the nonstandard flag.
     ///
     /// @param[in] fence passed on to flo_unary_op_node_inplace
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::standard(bool fence) {
         this->flo_unary_op_node_inplace(do_standard(this),fence);
         this->nonstandard = false;
     }


     /// Post-process the tree after an operator application and report the
     /// wall time spent.
     ///
     /// Four fenced sweeps over all nodes: consolidate the buffers (with a
     /// threshold 100 times tighter than the member tensor arguments), reduce
     /// the rank, change the tensor type, and truncate the NS leaves. The
     /// function is then flagged as compressed and nonstandard, not redundant.
     /// @param[in] fence if true, finish with one more global fence (not timed)
     /// @return wall time of the four sweeps as measured by wall_time()
     template <typename T, std::size_t NDIM>
     double FunctionImpl<T,NDIM>::finalize_apply(const bool fence) {
         TensorArgs tight(targs);
         tight.thresh*=0.01;

         const double t_start=wall_time();
         this->flo_unary_op_node_inplace(do_consolidate_buffer(tight),true);

         // reduce the rank of the final nodes, leave full tensors unchanged
         this->flo_unary_op_node_inplace(do_reduce_rank(targs),true);

         // change TT_FULL to low rank
         this->flo_unary_op_node_inplace(do_change_tensor_type(targs),true);

         // truncate leaf nodes to avoid excessive tree refinement
         this->flo_unary_op_node_inplace(do_truncate_NS_leafs(this),true);
         const double t_stop=wall_time();

         const double elapsed=t_stop-t_start;
         this->compressed=true;
         this->nonstandard=true;
         this->redundant=false;
         if (fence) {
             world.gop.fence();
         }
         return elapsed;
     }


     /// Reduce do_norm2sq_local over all entries of \c coeffs on the task queue.
     ///
     /// @return the value produced by the reduction (no inter-process
     ///         communication is issued here)
     template <typename T, std::size_t NDIM>
     double FunctionImpl<T,NDIM>::norm2sq_local() const {
         PROFILE_MEMBER_FUNC(FunctionImpl);
         typedef Range<typename dcT::const_iterator> rangeT;
         return world.taskq.reduce<double,rangeT,do_norm2sq_local>(
                    rangeT(coeffs.begin(),coeffs.end()),
                    do_norm2sq_local());
     }


     /// Largest key level found among the entries of \c coeffs.
     ///
     /// @return the maximum of \c level() over all stored keys, or 0 if
     ///         \c coeffs holds no entries
     template <typename T, std::size_t NDIM>
     std::size_t FunctionImpl<T,NDIM>::max_local_depth() const {
         std::size_t deepest = 0;
         for (typename dcT::const_iterator node=coeffs.begin(), last=coeffs.end(); node!=last; ++node) {
             const std::size_t level = static_cast<std::size_t>(node->first.level());
             if (deepest < level) {
                 deepest = level;
             }
         }
         return deepest;
     }


     /// Maximum of max_local_depth() taken over the world via \c world.gop.max.
     ///
     /// @return the globally reduced depth
     template <typename T, std::size_t NDIM>
     std::size_t FunctionImpl<T,NDIM>::max_depth() const {
         std::size_t depth = max_local_depth();
         world.gop.max(depth);   // in-place global reduction
         return depth;
     }


     /// Maximum of \c coeffs.size() taken over the world via \c world.gop.max.
     ///
     /// @return the globally reduced maximum node count
     template <typename T, std::size_t NDIM>
     std::size_t FunctionImpl<T,NDIM>::max_nodes() const {
         std::size_t nnodes = coeffs.size();
         world.gop.max(nnodes);   // in-place global reduction
         return nnodes;
     }


     /// Minimum of \c coeffs.size() taken over the world via \c world.gop.min.
     ///
     /// @return the globally reduced minimum node count
     template <typename T, std::size_t NDIM>
     std::size_t FunctionImpl<T,NDIM>::min_nodes() const {
         std::size_t nnodes = coeffs.size();
         world.gop.min(nnodes);   // in-place global reduction
         return nnodes;
     }


     /// Sum of \c coeffs.size() taken over the world via \c world.gop.sum.
     ///
     /// @return the globally summed node count
     template <typename T, std::size_t NDIM>
     std::size_t FunctionImpl<T,NDIM>::tree_size() const {
         std::size_t nnodes = coeffs.size();
         world.gop.sum(nnodes);   // in-place global reduction
         return nnodes;
     }


     /// Number of stored coefficients, summed over the world.
     ///
     /// The active branch adds up \c node.size() for every node that has
     /// coefficients; the disabled branch instead counts such nodes and
     /// multiplies by (2k)^NDIM (compressed) or k^NDIM (otherwise).
     ///
     /// @return the globally summed count
     template <typename T, std::size_t NDIM>
     std::size_t FunctionImpl<T,NDIM>::size() const {
         std::size_t ncoeff = 0;
 #if 1
         for (typename dcT::const_iterator it=coeffs.begin(), last=coeffs.end(); it!=last; ++it) {
             const nodeT& node = it->second;
             if (!node.has_coeff()) continue;
             ncoeff += node.size();
         }
         //            print("proc",world.rank(),ncoeff);
 #else
         for (typename dcT::const_iterator it=coeffs.begin(), last=coeffs.end(); it!=last; ++it) {
             const nodeT& node = it->second;
             if (!node.has_coeff()) continue;
             ++ncoeff;
         }
         if (is_compressed()) {
             for (std::size_t i=0; i<NDIM; ++i) ncoeff *= 2*cdata.k;
         }
         else {
             for (std::size_t i=0; i<NDIM; ++i) ncoeff *= cdata.k;
         }
 #endif
         world.gop.sum(ncoeff);

         return ncoeff;
     }


     /// Memory estimate for the tree, summed over the world.
     ///
     /// Each entry of \c coeffs is charged sizeof(keyT)+sizeof(nodeT); nodes
     /// that carry coefficients additionally contribute
     /// \c coeff().real_size().
     ///
     /// @return the globally summed estimate
     template <typename T, std::size_t NDIM>
     std::size_t FunctionImpl<T,NDIM>::real_size() const {
         // fixed per-entry overhead of the container
         std::size_t total = coeffs.size() * (sizeof(keyT) + sizeof(nodeT));

         // plus whatever the coefficient tensors themselves report
         for (typename dcT::const_iterator it=coeffs.begin(), last=coeffs.end(); it!=last; ++it) {
             const nodeT& node = it->second;
             if (!node.has_coeff()) continue;
             total += node.coeff().real_size();
         }

         world.gop.sum(total);
         return total;
     }


     /// Print one summary line (norm, tree size, memory figures) on rank 0.
     ///
     /// Calls tree_size(), size() and real_size(), globally sums
     /// norm2sq_local() and fences, so every process has to take part.
     /// The two memory figures are divided by 1024^3 and printed as GByte;
     /// the second is \c size() scaled by sizeof(T).
     ///
     /// @param[in] name  label printed at the start of the line
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::print_size(const std::string name) const {
         const size_t nnodes=this->tree_size();
         const size_t ncoeff=this->size();
         const size_t nbytes=this->real_size();
         const double now=wall_time();
         const double bytes_per_coeff=sizeof(T);
         const double gbyte=1024*1024*1024;

         // global 2-norm from the locally accumulated squared norms
         double norm2sq = norm2sq_local();
         this->world.gop.sum(norm2sq);
         this->world.gop.fence();
         const double norm=sqrt(norm2sq);

         if (this->world.rank()!=0) return;

         printf("%s at time %.1fs: norm/tree/real/size: %7.5f %zu, %6.3f, %6.3f GByte\n",
                (name.c_str()), now, norm, nnodes,double(nbytes)/gbyte,double(ncoeff)/gbyte*bytes_per_coeff);
     }


     /// Print a histogram of the ranks of the stored coefficient tensors.
     ///
     /// Returns immediately if the tensor type in \c targs is TT_FULL.
     /// Otherwise every node with coefficients is classified by
     /// \c coeff().rank():
     ///   - rank -1 is counted as "full rank",
     ///   - any other negative rank is reported with a "small rank" message,
     ///   - ranks from 0 to n.size()-1 are counted in the histogram \c n,
     ///   - ranks of n.size() or more are counted as "large rank".
     /// The histogram has k0^(NDIM/2)+1 bins, where k0 is \c k, or 2k for a
     /// compressed function.  All counters are summed over the world and
     /// printed on rank 0; because of these global sums every process has to
     /// call this function.
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::print_stats() const {
         if (this->targs.tt==TT_FULL) return;
         int dim=NDIM/2;
         int k0=k;
         if (is_compressed()) k0=2*k;
         Tensor<long> n(int(std::pow(double(k0),double(dim))+1));
         long n_full=0;
         long n_large=0;

         if (world.rank()==0) print("n.size(),k0,dim",n.size(),k0,dim);
         typename dcT::const_iterator end = coeffs.end();
         for (typename dcT::const_iterator it=coeffs.begin(); it!=end; ++it) {
             const nodeT& node = it->second;
             if (node.has_coeff()) {
                 const long rank = node.coeff().rank();
                 // valid histogram bins are 0..n.size()-1, so a rank equal to
                 // n.size() already belongs to the "large" bucket
                 if (rank>=long(n.size())) {
                     ++n_large;
                 } else if (rank==-1) {
                     ++n_full;
                 } else if (rank<0) {
                     print("small rank",rank);
                 } else {
                     n[rank]++;
                 }
             }
         }

         // make all counters global, not only the histogram
         world.gop.sum(n.ptr(), n.size());
         world.gop.sum(n_full);
         world.gop.sum(n_large);

         if (world.rank()==0) {
             print("configurations     number of nodes");
             print("        full rank    ",n_full);
             for (long i=0; i<long(n.size()); i++) {
                 long m=n[i];
                 print("           ",i,"    ",m);
             }
             print("       large rank    ",n_large);
         }
     }


     /// Evaluate the tensor-product expansion with coefficients \c c at point \c x.
     ///
     /// The first \c cdata.k Legendre scaling functions are tabulated for each
     /// component of \c x, contracted with \c c, and the result is scaled by
     /// 2^(NDIM*n/2) / sqrt(cell volume).
     ///
     /// @param[in] n  level entering the scaling factor
     /// @param[in] x  evaluation point, one coordinate per dimension
     ///               (presumably relative to the box of \c c -- confirm with callers)
     /// @param[in] c  coefficients; indexed with NDIM indices below k
     /// @return the scaled value of the expansion
     /// @throws MADNESS_EXCEPTION if NDIM is outside 1..6
     template <typename T, std::size_t NDIM>
     T FunctionImpl<T,NDIM>::eval_cube(Level n, coordT& x, const tensorT& c) const {
         PROFILE_MEMBER_FUNC(FunctionImpl);
         const int k = cdata.k;
         double phi[NDIM][k];
         T sum = T(0.0);

         // tabulate the 1-d scaling functions for every coordinate
         for (std::size_t d=0; d<NDIM; ++d) legendre_scaling_functions(x[d],k,phi[d]);

         // contract the coefficients with the tabulated values
         switch (NDIM) {
         case 1:
             for (int i0=0; i0<k; ++i0)
                 sum += c(i0)*phi[0][i0];
             break;
         case 2:
             for (int i0=0; i0<k; ++i0)
                 for (int i1=0; i1<k; ++i1)
                     sum += c(i0,i1)*phi[0][i0]*phi[1][i1];
             break;
         case 3:
             for (int i0=0; i0<k; ++i0)
                 for (int i1=0; i1<k; ++i1)
                     for (int i2=0; i2<k; ++i2)
                         sum += c(i0,i1,i2)*phi[0][i0]*phi[1][i1]*phi[2][i2];
             break;
         case 4:
             for (int i0=0; i0<k; ++i0)
                 for (int i1=0; i1<k; ++i1)
                     for (int i2=0; i2<k; ++i2)
                         for (int i3=0; i3<k; ++i3)
                             sum += c(i0,i1,i2,i3)*phi[0][i0]*phi[1][i1]*phi[2][i2]*phi[3][i3];
             break;
         case 5:
             for (int i0=0; i0<k; ++i0)
                 for (int i1=0; i1<k; ++i1)
                     for (int i2=0; i2<k; ++i2)
                         for (int i3=0; i3<k; ++i3)
                             for (int i4=0; i4<k; ++i4)
                                 sum += c(i0,i1,i2,i3,i4)*phi[0][i0]*phi[1][i1]*phi[2][i2]*phi[3][i3]*phi[4][i4];
             break;
         case 6:
             for (int i0=0; i0<k; ++i0)
                 for (int i1=0; i1<k; ++i1)
                     for (int i2=0; i2<k; ++i2)
                         for (int i3=0; i3<k; ++i3)
                             for (int i4=0; i4<k; ++i4)
                                 for (int i5=0; i5<k; ++i5)
                                     sum += c(i0,i1,i2,i3,i4,i5)*phi[0][i0]*phi[1][i1]*phi[2][i2]*phi[3][i3]*phi[4][i4]*phi[5][i5];
             break;
         default:
             MADNESS_EXCEPTION("FunctionImpl:eval_cube:NDIM?",NDIM);
         }
         return sum*pow(2.0,0.5*NDIM*n)/sqrt(FunctionDefaults<NDIM>::get_cell_volume());
     }


     /// Process node \c key for a given contribution \c s and pass the
     /// results on to the children.
     ///
     /// If the node is missing it is first inserted as an empty node without
     /// children.  For a node that has children or coefficients, \c s is added
     /// into the \c cdata.s0 slice of its coefficients (levels > 0 only); if the
     /// first dimension of the coefficients equals 2k they are unfiltered, the
     /// node's own coefficients are cleared, and one reconstruct_op task per
     /// child is submitted to the child's owner with that child's patch.
     /// Otherwise the node must be a leaf and only its rank is reduced.
     /// A node with neither children nor coefficients simply receives \c s
     /// (or zeros of shape \c cdata.vk if \c s holds no data).
     ///
     /// @param[in] key  node to process
     /// @param[in] s    coefficients handed down to this node
     /// @return None
     template <typename T, std::size_t NDIM>
     Void FunctionImpl<T,NDIM>::reconstruct_op(const keyT& key, const coeffT& s) {
         PROFILE_MEMBER_FUNC(FunctionImpl);
         // Note that after application of an integral operator not all
         // siblings may be present so it is necessary to check existence
         // and if absent insert an empty leaf node.
         //
         // If summing the result of an integral operator (i.e., from
         // non-standard form) there will be significant scaling function
         // coefficients at all levels and possibly difference coefficients
         // in leaves, hence the tree may refine as a result.
         typename dcT::iterator it = coeffs.find(key).get();
         if (it == coeffs.end()) {
             coeffs.replace(key,nodeT(coeffT(),false));
             it = coeffs.find(key).get();
         }
         nodeT& node = it->second;

         // The integral operator will correctly connect interior nodes
         // to children but may leave interior nodes without coefficients
         // ... but they still need to sum down so just give them zeros
         if (node.has_children() && !node.has_coeff()) {
             node.set_coeff(coeffT(cdata.v2k,targs));
         }

         if (node.has_children() || node.has_coeff()) { // Must allow for inconsistent state from transform, etc.
             coeffT d = node.coeff();
             if (!d.has_data()) d = coeffT(cdata.v2k,targs);
             if (key.level() > 0) d(cdata.s0) += s; // -- note accumulate for NS summation
             if (d.dim(0)==2*get_k()) {              // d might be pre-truncated if it's a leaf
                 // d has the full 2k extent: unfilter it and hand one patch to each child
                 d = unfilter(d);
                 node.clear_coeff();
                 node.set_has_children(true);
                 for (KeyChildIterator<NDIM> kit(key); kit; ++kit) {
                     const keyT& child = kit.key();
                     // deep copy of the child's patch before it is shipped to the child's owner
                     coeffT ss = copy(d(child_patch(child)));
                     // NOTE(review): uses thresh here, whereas the leaf branch below uses targs.thresh -- confirm this is intended
                     ss.reduce_rank(thresh);
                     PROFILE_BLOCK(recon_send);
                     woT::task(coeffs.owner(child), &implT::reconstruct_op, child, ss);
                 }
             } else {
                 // coefficients do not have the 2k extent: nothing to pass down
                 MADNESS_ASSERT(node.is_leaf());
                 //                node.coeff()+=s;
                 node.coeff().reduce_rank(targs.thresh);
             }
         }
         else {
             // node has neither children nor coefficients: store what was handed down
             coeffT ss=s;
             if (s.has_no_data()) ss=coeffT(cdata.vk,targs);
             // below the root a deep copy is stored; at level 0 ss is stored directly
             if (key.level()) node.set_coeff(copy(ss));
             else node.set_coeff(ss);
         }
         return None;
     }


     /// Tabulate a plain function on the quadrature grid of box \c key and
     /// return the values in a freshly allocated tensor.
     ///
     /// The function pointer is wrapped in an ElementaryInterface and the work
     /// is delegated to the four-argument fcube().
     ///
     /// @param[in] key  box to tabulate on
     /// @param[in] f    function to evaluate
     /// @param[in] qx   1-d points; its first extent fixes the grid size per dimension
     /// @return tensor with qx.dim(0) entries along each of the NDIM dimensions
     template <typename T, std::size_t NDIM>
     Tensor<T> fcube(const Key<NDIM>& key, T (*f)(const Vector<double,NDIM>&), const Tensor<double>& qx) {
         // same number of points along every dimension
         std::vector<long> extents(NDIM,qx.dim(0));
         Tensor<T> values(extents);

         fcube(key,ElementaryInterface<T,NDIM>(f) , qx, values);
         return values;
     }


     /// Tabulate a functor on the quadrature grid of box \c key and return the
     /// values in a freshly allocated tensor.
     ///
     /// The work is delegated to the four-argument fcube().
     ///
     /// @param[in] key  box to tabulate on
     /// @param[in] f    functor to evaluate
     /// @param[in] qx   1-d points; its first extent fixes the grid size per dimension
     /// @return tensor with qx.dim(0) entries along each of the NDIM dimensions
     template <typename T, std::size_t NDIM>
     Tensor<T> fcube(const Key<NDIM>& key, const FunctionFunctorInterface<T,NDIM>& f, const Tensor<double>& qx) {
         // same number of points along every dimension
         std::vector<long> extents(NDIM,qx.dim(0));
         Tensor<T> values(extents);

         fcube(key, f, qx, values);
         return values;
     }


     template <typename T, std::size_t NDIM>

     //    void FunctionImpl<T,NDIM>::fcube(const keyT& key, const FunctionFunctorInterface<T,NDIM>& f, const Tensor<double>& qx, tensorT& fval) const {

     void fcube(const Key<NDIM>& key, const FunctionFunctorInterface<T,NDIM>& f, const Tensor<double>& qx, Tensor<T>& fval) {

         //~ template <typename T, std::size_t NDIM> template< typename FF>

         //~ void FunctionImpl<T,NDIM>::fcube(const keyT& key, const FF& f, const Tensor<double>& qx, tensorT& fval) const {

         typedef Vector<double,NDIM> coordT;

         PROFILE_MEMBER_FUNC(FunctionImpl);

         const Vector<Translation,NDIM>& l = key.translation();

         const Level n = key.level();

         const double h = std::pow(0.5,double(n));

         coordT c; // will hold the point in user coordinates

         const int npt = qx.dim(0);


         const Tensor<double>& cell_width = FunctionDefaults<NDIM>::get_cell_width();

         const Tensor<double>& cell = FunctionDefaults<NDIM>::get_cell();


         // Do pre-screening of the FunctionFunctorInterface, f, before calculating f(r) at quadrature points

         coordT c1, c2;

         for (int i = 0; i < NDIM; i++) {

           c1[i] = cell(i,0) + h*cell_width[i]*(l[i] + qx((long)0));

           c2[i] = cell(i,0) + h*cell_width[i]*(l[i] + qx(npt-1));

         }

         if (f.screened(c1, c2)) {

             fval(___) = 0.0;

             return;

         }


         Tensor<double> vqx;

         bool vectorized = f.supports_vectorized();

         if (vectorized) {

             T* fvptr = fval.ptr();

             if (NDIM == 1) {

                 double* x1 = new double[npt];

                 int idx = 0;

                 for (int i=0; i<npt; ++i, ++idx) {

                     c[0] = cell(0,0) + h*cell_width[0]*(l[0] + qx(i)); // x

                     x1[idx] = c[0];

                 }

                 Vector<double*,1> xvals = vec(x1);

                 f(xvals, fvptr, npt);

                 delete [] x1;

             }

             else if (NDIM == 2) {

                 double* x1 = new double[npt*npt];

                 double* x2 = new double[npt*npt];

                 int idx = 0;

                 for (int i=0; i<npt; ++i) {

                     c[0] = cell(0,0) + h*cell_width[0]*(l[0] + qx(i)); // x

                     for (int j=0; j<npt; ++j, ++idx) {

                         c[1] = cell(1,0) + h*cell_width[1]*(l[1] + qx(j)); // y

                         x1[idx] = c[0];

                         x2[idx] = c[1];

                     }

                 }

                 Vector<double*,2> xvals = vec(x1, x2);

                 f(xvals, fvptr, npt*npt);

                 delete [] x1;

                 delete [] x2;

             }

             else if (NDIM == 3) {

                 double* x1 = new double[npt*npt*npt];

                 double* x2 = new double[npt*npt*npt];

                 double* x3 = new double[npt*npt*npt];

                 int idx = 0;

                 for (int i=0; i<npt; ++i) {

                     c[0] = cell(0,0) + h*cell_width[0]*(l[0] + qx(i)); // x

                     for (int j=0; j<npt; ++j) {

                         c[1] = cell(1,0) + h*cell_width[1]*(l[1] + qx(j)); // y

                         for (int k=0; k<npt; ++k, ++idx) {

                             c[2] = cell(2,0) + h*cell_width[2]*(l[2] + qx(k)); // z

                             x1[idx] = c[0];

                             x2[idx] = c[1];

                             x3[idx] = c[2];

                         }

                     }

                 }

                 Vector<double*,3> xvals = vec(x1, x2, x3);

                 f(xvals, fvptr, npt*npt*npt);

                 delete [] x1;

                 delete [] x2;

                 delete [] x3;

             }

             else if (NDIM == 4) {

                 double* x1 = new double[npt*npt*npt*npt];

                 double* x2 = new double[npt*npt*npt*npt];

                 double* x3 = new double[npt*npt*npt*npt];

                 double* x4 = new double[npt*npt*npt*npt];

                 int idx = 0;

                 for (int i=0; i<npt; ++i) {

                     c[0] = cell(0,0) + h*cell_width[0]*(l[0] + qx(i)); // x

                     for (int j=0; j<npt; ++j) {

                         c[1] = cell(1,0) + h*cell_width[1]*(l[1] + qx(j)); // y

                         for (int k=0; k<npt; ++k) {

                             c[2] = cell(2,0) + h*cell_width[2]*(l[2] + qx(k)); // z

                             for (int m=0; m<npt; ++m, ++idx) {

                                 c[3] = cell(3,0) + h*cell_width[3]*(l[3] + qx(m)); // xx

                                 x1[idx] = c[0];

                                 x2[idx] = c[1];

                                 x3[idx] = c[2];

                                 x4[idx] = c[3];

                             }

                         }

                     }

                 }

                 Vector<double*,4> xvals = vec(x1, x2, x3, x4);

                 f(xvals, fvptr, npt*npt*npt*npt);

                 delete [] x1;

                 delete [] x2;

                 delete [] x3;

                 delete [] x4;

             }

             else if (NDIM == 5) {

                 double* x1 = new double[npt*npt*npt*npt*npt];

                 double* x2 = new double[npt*npt*npt*npt*npt];

                 double* x3 = new double[npt*npt*npt*npt*npt];

                 double* x4 = new double[npt*npt*npt*npt*npt];

                 double* x5 = new double[npt*npt*npt*npt*npt];

                 int idx = 0;

                 for (int i=0; i<npt; ++i) {

                     c[0] = cell(0,0) + h*cell_width[0]*(l[0] + qx(i)); // x

                     for (int j=0; j<npt; ++j) {

                         c[1] = cell(1,0) + h*cell_width[1]*(l[1] + qx(j)); // y

                         for (int k=0; k<npt; ++k) {

                             c[2] = cell(2,0) + h*cell_width[2]*(l[2] + qx(k)); // z

                             for (int m=0; m<npt; ++m) {

                                 c[3] = cell(3,0) + h*cell_width[3]*(l[3] + qx(m)); // xx

                                 for (int n=0; n<npt; ++n, ++idx) {

                                     c[4] = cell(4,0) + h*cell_width[4]*(l[4] + qx(n)); // yy

                                     x1[idx] = c[0];

                                     x2[idx] = c[1];

                                     x3[idx] = c[2];

                                     x4[idx] = c[3];

                                     x5[idx] = c[4];

                                 }

                             }

                         }

                     }

                 }

                 Vector<double*,5> xvals = vec(x1, x2, x3, x4, x5);

                 f(xvals, fvptr, npt*npt*npt*npt*npt);

                 delete [] x1;

                 delete [] x2;

                 delete [] x3;

                 delete [] x4;

                 delete [] x5;

             }

             else if (NDIM == 6) {

                 double* x1 = new double[npt*npt*npt*npt*npt*npt];

                 double* x2 = new double[npt*npt*npt*npt*npt*npt];

                 double* x3 = new double[npt*npt*npt*npt*npt*npt];

                 double* x4 = new double[npt*npt*npt*npt*npt*npt];

                 double* x5 = new double[npt*npt*npt*npt*npt*npt];

                 double* x6 = new double[npt*npt*npt*npt*npt*npt];

                 int idx = 0;

                 for (int i=0; i<npt; ++i) {

                     c[0] = cell(0,0) + h*cell_width[0]*(l[0] + qx(i)); // x

                     for (int j=0; j<npt; ++j) {

                         c[1] = cell(1,0) + h*cell_width[1]*(l[1] + qx(j)); // y

                         for (int k=0; k<npt; ++k) {

                             c[2] = cell(2,0) + h*cell_width[2]*(l[2] + qx(k)); // z

                             for (int m=0; m<npt; ++m) {

                                 c[3] = cell(3,0) + h*cell_width[3]*(l[3] + qx(m)); // xx

                                 for (int n=0; n<npt; ++n) {

                                     c[4] = cell(4,0) + h*cell_width[4]*(l[4] + qx(n)); // yy

                                     for (int p=0; p<npt; ++p, ++idx) {

                                         c[5] = cell(5,0) + h*cell_width[5]*(l[5] + qx(p)); // zz

                                         x1[idx] = c[0];

                                         x2[idx] = c[1];

                                         x3[idx] = c[2];

                                         x4[idx] = c[3];

                                         x5[idx] = c[4];

                                         x6[idx] = c[5];

                                     }

                                 }

                             }

                         }

                     }

                 }

                 Vector<double*,6> xvals = vec(x1, x2, x3, x4, x5, x6);

                 f(xvals, fvptr, npt*npt*npt*npt*npt*npt);

                 delete [] x1;

                 delete [] x2;

                 delete [] x3;

                 delete [] x4;

                 delete [] x5;

                 delete [] x6;

             }

             else {

                 MADNESS_EXCEPTION("FunctionImpl: fcube: confused about NDIM?",NDIM);

             }

         }

         else {

             if (NDIM == 1) {

                 for (int i=0; i<npt; ++i) {

                     c[0] = cell(0,0) + h*cell_width[0]*(l[0] + qx(i)); // x

                     fval(i) = f(c);

                 }

             }

             else if (NDIM == 2) {

                 for (int i=0; i<npt; ++i) {

                     c[0] = cell(0,0) + h*cell_width[0]*(l[0] + qx(i)); // x

                     for (int j=0; j<npt; ++j) {

                         c[1] = cell(1,0) + h*cell_width[1]*(l[1] + qx(j)); // y

                         fval(i,j) = f(c);

                     }

                 }

             }

             else if (NDIM == 3) {

                 for (int i=0; i<npt; ++i) {

                     c[0] = cell(0,0) + h*cell_width[0]*(l[0] + qx(i)); // x

                     for (int j=0; j<npt; ++j) {

                         c[1] = cell(1,0) + h*cell_width[1]*(l[1] + qx(j)); // y

                         for (int k=0; k<npt; ++k) {

                             c[2] = cell(2,0) + h*cell_width[2]*(l[2] + qx(k)); // z

                             fval(i,j,k) = f(c);

                         }

                     }

                 }

             }

             else if (NDIM == 4) {

                 for (int i=0; i<npt; ++i) {

                     c[0] = cell(0,0) + h*cell_width[0]*(l[0] + qx(i)); // x

                     for (int j=0; j<npt; ++j) {

                         c[1] = cell(1,0) + h*cell_width[1]*(l[1] + qx(j)); // y

                         for (int k=0; k<npt; ++k) {

                             c[2] = cell(2,0) + h*cell_width[2]*(l[2] + qx(k)); // z

                             for (int m=0; m<npt; ++m) {

                                 c[3] = cell(3,0) + h*cell_width[3]*(l[3] + qx(m)); // xx

                                 fval(i,j,k,m) = f(c);

                             }

                         }

                     }

                 }

             }

             else if (NDIM == 5) {

                 for (int i=0; i<npt; ++i) {

                     c[0] = cell(0,0) + h*cell_width[0]*(l[0] + qx(i)); // x

                     for (int j=0; j<npt; ++j) {

                         c[1] = cell(1,0) + h*cell_width[1]*(l[1] + qx(j)); // y

                         for (int k=0; k<npt; ++k) {

                             c[2] = cell(2,0) + h*cell_width[2]*(l[2] + qx(k)); // z

                             for (int m=0; m<npt; ++m) {

                                 c[3] = cell(3,0) + h*cell_width[3]*(l[3] + qx(m)); // xx

                                 for (int n=0; n<npt; ++n) {

                                     c[4] = cell(4,0) + h*cell_width[4]*(l[4] + qx(n)); // yy

                                     fval(i,j,k,m,n) = f(c);

                                 }

                             }

                         }

                     }

                 }

             }

             else if (NDIM == 6) {

                 for (int i=0; i<npt; ++i) {

                     c[0] = cell(0,0) + h*cell_width[0]*(l[0] + qx(i)); // x

                     for (int j=0; j<npt; ++j) {

                         c[1] = cell(1,0) + h*cell_width[1]*(l[1] + qx(j)); // y

                         for (int k=0; k<npt; ++k) {

                             c[2] = cell(2,0) + h*cell_width[2]*(l[2] + qx(k)); // z

                             for (int m=0; m<npt; ++m) {

                                 c[3] = cell(3,0) + h*cell_width[3]*(l[3] + qx(m)); // xx

                                 for (int n=0; n<npt; ++n) {

                                     c[4] = cell(4,0) + h*cell_width[4]*(l[4] + qx(n)); // yy

                                     for (int p=0; p<npt; ++p) {

                                         c[5] = cell(5,0) + h*cell_width[5]*(l[5] + qx(p)); // zz

                                         fval(i,j,k,m,n,p) = f(c);

                                     }

                                 }

                             }

                         }

                     }

                 }

             }

             else {

                 MADNESS_EXCEPTION("FunctionImpl: fcube: confused about NDIM?",NDIM);

             }

         }

     }


     /// Member convenience wrapper: tabulate a plain function on box \c key.
     ///
     /// Wraps \c f in an ElementaryInterface and forwards to the free function
     /// madness::fcube(), which fills \c fval.
     ///
     /// @param[in]  key   box to tabulate on
     /// @param[in]  f     function to evaluate
     /// @param[in]  qx    1-d points passed through unchanged
     /// @param[out] fval  receives the values
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::fcube(const keyT& key, T (*f)(const coordT&), const Tensor<double>& qx, tensorT& fval) const {
         madness::fcube(key, ElementaryInterface<T,NDIM>(f), qx, fval);
     }


     /// Member convenience wrapper: tabulate a functor on box \c key.
     ///
     /// Forwards all arguments unchanged to the free function madness::fcube(),
     /// which fills \c fval.
     ///
     /// @param[in]  key   box to tabulate on
     /// @param[in]  f     functor to evaluate
     /// @param[in]  qx    1-d points passed through unchanged
     /// @param[out] fval  receives the values
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::fcube(const keyT& key, const FunctionFunctorInterface<T,NDIM>& f, const Tensor<double>& qx, tensorT& fval) const {
         madness::fcube(key, f, qx, fval);
     }


     /// Project the functor onto box \c key, refining adaptively if requested.
     ///
     /// Without refinement (or at \c max_refine_level and beyond) the box is
     /// simply projected and stored as a node without children.  Otherwise the
     /// 2^NDIM children are projected, the result is filtered and the norm of
     /// the part outside the \c cdata.s0 slice decides what happens:
     ///   - if special points remain near this box, or that norm reaches
     ///     truncate_tol(thresh, level), an empty parent is stored and one
     ///     project_refine_op task per child is spawned;
     ///   - otherwise, with \c truncate_on_project the \c cdata.s0 part is
     ///     stored at \c key; without it an empty parent is stored and the
     ///     already computed child coefficients are inserted directly.
     ///
     /// @param[in] key         box to project onto
     /// @param[in] do_refine   whether adaptive refinement is allowed
     /// @param[in] specialpts  user-coordinate points that force refinement
     /// @return None
     template <typename T, std::size_t NDIM>
     Void FunctionImpl<T,NDIM>::project_refine_op(const keyT& key,
                                                  bool do_refine,
                                                  const std::vector<Vector<double,NDIM> >& specialpts) {
         PROFILE_MEMBER_FUNC(FunctionImpl);

         // No refinement wanted or possible: plain projection onto this box
         if (!do_refine || key.level() >= max_refine_level) {
             coeffs.replace(key,nodeT(coeffT(project(key),targs),false));
             return None;
         }

         // Restrict special points to this box
         std::vector<Vector<double,NDIM> > nearby_pts;
         if (key.level() < functor->special_level() && specialpts.size() > 0) {
             BoundaryConditions<NDIM> bc = FunctionDefaults<NDIM>::get_bc();
             std::vector<bool> periodic = bc.is_periodic();
             for (unsigned int ipt = 0; ipt < specialpts.size(); ++ipt) {
                 coordT simpt;
                 user_to_sim(specialpts[ipt], simpt);
                 Key<NDIM> ptkey = simpt2key(simpt, key.level());
                 if (!ptkey.is_neighbor_of(key,periodic)) continue;
                 nearby_pts.push_back(specialpts[ipt]);
             }
         }

         // Scaling function coefficients of the children and the norm of the
         // difference coefficients at this level
         tensorT child_coeffs, parent_sum;
         double dnorm = 0.0;
         {
             // Make in child_coeffs the child scaling function coeffs at level n+1
             child_coeffs = tensorT(cdata.v2k);
             for (KeyChildIterator<NDIM> it(key); it; ++it) {
                 const keyT& child = it.key();
                 child_coeffs(child_patch(child)) = project(child);
             }
             // Filter then test difference coeffs at level n
             tensorT d = filter(child_coeffs);
             if (truncate_on_project) parent_sum = copy(d(cdata.s0));
             d(cdata.s0) = T(0);
             dnorm = d.normf();
         }

         // If have special points always refine.  If don't have special points
         // refine if difference norm is big
         const bool must_refine = nearby_pts.size() > 0 || dnorm >=truncate_tol(thresh,key.level());

         if (must_refine) {
             coeffs.replace(key,nodeT(coeffT(),true)); // Insert empty node for parent
             for (KeyChildIterator<NDIM> it(key); it; ++it) {
                 const keyT& child = it.key();
                 const ProcessID dest = FunctionDefaults<NDIM>::get_project_randomize()
                     ? world.random_proc()
                     : coeffs.owner(child);
                 PROFILE_BLOCK(proj_refine_send);
                 woT::task(dest, &implT::project_refine_op, child, do_refine, nearby_pts);
             }
         }
         else if (truncate_on_project) {
             // keep only the sum coefficients at this level
             coeffT s(parent_sum,thresh,FunctionDefaults<NDIM>::get_tensor_type());
             coeffs.replace(key,nodeT(s,false));
         }
         else {
             coeffs.replace(key,nodeT(coeffT(),true)); // Insert empty node for parent
             for (KeyChildIterator<NDIM> it(key); it; ++it) {
                 const keyT& child = it.key();
                 coeffT s(child_coeffs(child_patch(child)),thresh,FunctionDefaults<NDIM>::get_tensor_type());
                 coeffs.replace(child,nodeT(s,false));
             }
         }
         return None;
     }


     /// Add the constant \c t to this function in place.
     ///
     /// Compressed form: only the owner of the root node \c cdata.key0 acts.
     /// The root coefficients are switched to a full tensor, the element at
     /// index (0,...,0) is increased by t*sqrt(cell volume), and the tensor is
     /// switched back to the type in \c targs.
     ///
     /// Otherwise: every node holding coefficients gets
     /// t*sqrt(cell volume * 0.5^(NDIM*n)) added to its element at index
     /// (0,...,0), n being the level of the node.
     ///
     /// @param[in] t      constant to add
     /// @param[in] fence  if true, finish with a global fence
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::add_scalar_inplace(T t, bool fence) {
         std::vector<long> origin(NDIM,0L);
         std::vector<long> unit_extent(NDIM,1L);
         std::vector<Slice> first_element(NDIM,Slice(0,0));
         const TensorArgs full_args(-1.0,TT_FULL);

         if (!is_compressed()) {
             for (typename dcT::iterator it=coeffs.begin(); it!=coeffs.end(); ++it) {
                 Level n = it->first.level();
                 nodeT& node = it->second;
                 if (!node.has_coeff()) continue;

                 // A single element of a GenTensor cannot be addressed directly,
                 // so build a 1^NDIM tensor holding the increment, convert it
                 // to a GenTensor and add it onto the matching slice.
                 tensorT increment(unit_extent);
                 increment=t*sqrt(FunctionDefaults<NDIM>::get_cell_volume()*pow(0.5,double(NDIM*n)));
                 coeffT increment_gen(increment,get_tensor_args());
                 node.coeff()(first_element) += increment_gen;
             }
         }
         else if (world.rank() == coeffs.owner(cdata.key0)) {
             typename dcT::iterator root = coeffs.find(cdata.key0).get();
             MADNESS_ASSERT(root != coeffs.end());
             nodeT& node = root->second;
             MADNESS_ASSERT(node.has_coeff());

             // go through a full tensor to reach the single element, then restore the type
             change_tensor_type(node.coeff(),full_args);
             node.coeff().full_tensor()(origin) += t*sqrt(FunctionDefaults<NDIM>::get_cell_volume());
             change_tensor_type(node.coeff(),targs);
         }

         if (fence) world.gop.fence();
     }


     /// Recursively insert zero/empty nodes from \c key down to \c initial_level.
     ///
     /// Nodes are only written for keys that are local to this process, but the
     /// recursion visits every child key above \c initial_level regardless of locality.
     /// @param[in] key  the box at which to start
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::insert_zero_down_to_initial_level(const keyT& key) {
         PROFILE_MEMBER_FUNC(FunctionImpl);

         // Otherwise zero function is confused
         if (compressed) initial_level = std::max(initial_level,1);

         const bool above_initial = (key.level() < initial_level);

         if (coeffs.is_local(key)) {
             if (compressed) {
                 // Compressed form: the node at initial_level is an empty leaf, every
                 // other node carries a zeroed v2k block and is flagged as having children.
                 const bool at_initial = (key.level() == initial_level);
                 if (at_initial)
                     coeffs.replace(key, nodeT(coeffT(), false));
                 else
                     coeffs.replace(key, nodeT(coeffT(cdata.v2k,targs), true));
             }
             else if (above_initial) {
                 // Not compressed: nodes above initial_level are empty with children ...
                 coeffs.replace(key, nodeT(coeffT(), true));
             }
             else {
                 // ... and the remaining ones are leaves with a zeroed vk block.
                 coeffs.replace(key, nodeT(coeffT(cdata.vk,targs), false));
             }
         }

         if (above_initial) {
             for (KeyChildIterator<NDIM> child(key); child; ++child) {
                 insert_zero_down_to_initial_level(child.key());
             }
         }
     }


     /// Recursive truncation driver for the node at \c key.
     ///
     /// For a node with children, one truncate_spawn task is launched per child and a
     /// truncate_op task on this process consumes their results.  For a leaf, any
     /// coefficients below the truncation threshold are discarded (only for levels > 1).
     /// @param[in] key  node to process
     /// @param[in] tol  truncation tolerance handed to truncate_tol
     /// @return future that is true if the node still holds coefficients afterwards
     template <typename T, std::size_t NDIM>
     Future<bool> FunctionImpl<T,NDIM>::truncate_spawn(const keyT& key, double tol) {
         PROFILE_MEMBER_FUNC(FunctionImpl);

         typename dcT::iterator it = coeffs.find(key).get();
         if (it == coeffs.end()) {
             // In a standard tree all children would exist but some ops (transform)
             // can leave the tree in a messy state.  Just make the missing node as an
             // empty leaf.
             coeffs.replace(key,nodeT());
             it = coeffs.find(key).get();
         }
         nodeT& node = it->second;

         if (!node.has_children()) {
             // In compressed form leaves should not have coeffs ... however the
             // transform op could leave the tree with leaves that do have coeffs
             // in which case we want something sensible to happen
             //MADNESS_ASSERT(!node.has_coeff());
             if (node.has_coeff() && key.level()>1) {
                 const double leaf_norm = node.coeff().normf();
                 if (leaf_norm < truncate_tol(tol,key)) node.clear_coeff();
             }
             return Future<bool>(node.has_coeff());
         }

         // Interior node: gather the outcome of every child, then decide locally.
         std::vector< Future<bool> > child_results = future_vector_factory<bool>(1<<NDIM);
         int slot=0;
         for (KeyChildIterator<NDIM> child(key); child; ++child,++slot) {
             child_results[slot] = woT::task(coeffs.owner(child.key()), &implT::truncate_spawn, child.key(), tol, TaskAttributes::generator());
         }
         return woT::task(world.rank(),&implT::truncate_op, key, tol, child_results);
     }


     /// Decide whether the node at \c key can be truncated once its children are done.
     ///
     /// @param[in] key  node to examine
     /// @param[in] tol  truncation tolerance handed to truncate_tol
     /// @param[in] v    one future per child (1<<NDIM entries are read), true if that child kept coefficients
     /// @return true if any child kept coefficients, otherwise whether this node still has coefficients
     template <typename T, std::size_t NDIM>
     bool FunctionImpl<T,NDIM>::truncate_op(const keyT& key, double tol, const std::vector< Future<bool> >& v) {
         PROFILE_MEMBER_FUNC(FunctionImpl);

         // If any child has coefficients, a parent cannot truncate
         const int nchild = (1<<NDIM);
         for (int c=0; c<nchild; ++c) {
             if (v[c].get()) return true;
         }

         nodeT& node = coeffs.find(key).get()->second;

         // Interior nodes should always have coeffs but transform might
         // leave empty interior nodes ... hence just force no coeffs to
         // be zero coeff unless it is a leaf.
         if (node.has_children() && !node.has_coeff()) node.set_coeff(coeffT(cdata.v2k,targs));

         // >1 rather >0 otherwise reconstruct might get confused.  The norm is only
         // evaluated when the level test passes.
         const bool negligible = (key.level() > 1) && (node.coeff().normf() < truncate_tol(tol,key));
         if (negligible) {
             node.clear_coeff();
             if (node.has_children()) {
                 // The node becomes a leaf: drop the child nodes from the container.
                 node.set_has_children(false);
                 for (KeyChildIterator<NDIM> child(key); child; ++child) {
                     coeffs.erase(child.key());
                 }
             }
         }
         return node.has_coeff();
     }


     /// Print the tree starting at the root key; only rank 0 writes to \c os.
     ///
     /// All processes take part in the two global fences.
     /// @param[in,out] os        stream written to on rank 0
     /// @param[in]     maxlevel  children are not printed at or below this level
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::print_tree(std::ostream& os, Level maxlevel) const {
         const bool is_printer = (world.rank() == 0);

         if (is_printer) do_print_tree(cdata.key0, os, maxlevel);
         world.gop.fence();

         if (is_printer) os.flush();
         world.gop.fence();
     }


     /// Recursive worker for print_tree: prints the node at \c key and then its children.
     ///
     /// Each line is indented by two spaces per level and ends with the owning process.
     /// A key that is not found is reported as "missing" and is not descended into.
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::do_print_tree(const keyT& key, std::ostream& os, Level maxlevel) const {
         typename dcT::const_iterator it = coeffs.find(key).get();

         // Indentation is the same whether or not the node exists
         for (int depth=0; depth<key.level(); ++depth) os << "  ";

         if (it == coeffs.end()) {
             //MADNESS_EXCEPTION("FunctionImpl: do_print_tree: null node pointer",0);
             os << key << "  missing --> " << coeffs.owner(key) << "\n";
             return;
         }

         const nodeT& node = it->second;
         os << key << "  " << node << " --> " << coeffs.owner(key) << "\n";

         if (key.level() >= maxlevel || !node.has_children()) return;

         for (KeyChildIterator<NDIM> child(key); child; ++child) {
             do_print_tree(child.key(),os,maxlevel);
         }
     }


     /// Write the parent -> child edges of the tree to \c os; only rank 0 writes.
     ///
     /// All processes take part in the two global fences.
     /// @param[in,out] os        stream written to on rank 0
     /// @param[in]     maxlevel  children are not emitted at or below this level
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::print_tree_graphviz(std::ostream& os, Level maxlevel) const {
         const bool is_printer = (world.rank() == 0);

         if (is_printer) do_print_tree_graphviz(cdata.key0, os, maxlevel);
         world.gop.fence();

         if (is_printer) os.flush();
         world.gop.fence();
     }


     /// Recursive worker for print_tree_graphviz.
     ///
     /// For the node at \c key, writes one line "<parent id> -> <child id>" per child and
     /// recurses into each child.  Keys that are not found, leaves, and nodes at or
     /// below \c maxlevel produce no output.
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::do_print_tree_graphviz(const keyT& key, std::ostream& os, Level maxlevel) const {

         // Maps a key onto an integer node id: the sum of 2^(j*NDIM) over all coarser
         // levels j, plus the first translation component.
         // NOTE(review): only translation()[0] enters the id, so ids look unique only
         // for NDIM==1 -- confirm whether that is intended.
         struct uniqhash {
             static int64_t value(const keyT& key) {
                 int64_t result = 0;
                 for (int64_t j = 0; j <= key.level()-1; ++j) {
                     // Shift a 64-bit one: shifting the int literal 1 is undefined
                     // as soon as j*NDIM reaches the width of int.
                     result += (static_cast<int64_t>(1) << (j*NDIM));
                 }
                 result += key.translation()[0];
                 return result;
             }
         };

         typename dcT::const_iterator it = coeffs.find(key).get();
         if (it != coeffs.end()) {
             const nodeT& node = it->second;
             if (key.level() < maxlevel  &&  node.has_children()) {
                 for (KeyChildIterator<NDIM> kit(key); kit; ++kit) {
                     os << uniqhash::value(key) << " -> " << uniqhash::value(kit.key()) << "\n";
                     do_print_tree_graphviz(kit.key(),os,maxlevel);
                 }
             }
         }
     }


     /// Compute the coefficient tensor of the functor in the box \c key.
     ///
     /// If the functor can supply coefficients itself those are returned directly.
     /// Otherwise the functor is sampled with fcube at the quadrature points, scaled
     /// by the square root of the box volume, and transformed with \c cdata.quad_phiw.
     /// @param[in] key  the box to project into
     /// @return the resulting tensor
     template <typename T, std::size_t NDIM>
     Tensor<T> FunctionImpl<T,NDIM>::project(const keyT& key) const {
         PROFILE_MEMBER_FUNC(FunctionImpl);

         if (!functor) MADNESS_EXCEPTION("FunctionImpl: project: confusion about function?",0);

         // if functor provides coeffs directly, awesome; otherwise compute them here
         if (functor->provides_coeff()) return functor->coeff(key).full_tensor_copy();

         MADNESS_ASSERT(cdata.npt == cdata.k); // only necessary due to use of fast transform
         tensorT fval(cdata.vq,false);      // this will be the returned result
         tensorT values(cdata.vk,false);    // initially evaluate the function in here
         tensorT scratch(cdata.vq,false);   // workspace handed to fast_transform

         madness::fcube(key,*functor,cdata.quad_x,values);

         const double box_scale = sqrt(FunctionDefaults<NDIM>::get_cell_volume()*pow(0.5,double(NDIM*key.level())));
         values.scale(box_scale);

         //return transform(values,cdata.quad_phiw);
         return fast_transform(values,cdata.quad_phiw,fval,scratch);
     }


     /// Return the norm_tree value of \c key, or of its nearest existing ancestor.
     ///
     /// If the node is not present the request is forwarded as a high-priority task
     /// to the owner of the parent key.
     template <typename T, std::size_t NDIM>
     Future<double> FunctionImpl<T,NDIM>::get_norm_tree_recursive(const keyT& key) const {
         if (!coeffs.probe(key)) {
             // Nothing stored here: climb one level (the root itself must exist)
             MADNESS_ASSERT(key.level());
             keyT up = key.parent();
             return woT::task(coeffs.owner(up), &implT::get_norm_tree_recursive, up, TaskAttributes::hipri());
         }
         return Future<double>(coeffs.find(key).get()->second.get_norm_tree());
     }


     /// Deliver (key, coefficients) of \c key, or of its nearest existing ancestor, to a remote future.
     ///
     /// If the node exists, the future referenced by \c ref is set to the pair of its key
     /// and its coefficients (an empty coeffT when the node has none).  If it does
     /// not exist the request is forwarded to the owner of the parent key.
     /// @param[in] key  the node being asked for
     /// @param[in] ref  remote reference to the future that receives the answer
     template <typename T, std::size_t NDIM>
     Void FunctionImpl<T,NDIM>::sock_it_to_me(const keyT& key,
                                              const RemoteReference< FutureImpl< std::pair<keyT,coeffT> > >& ref) const {
         PROFILE_MEMBER_FUNC(FunctionImpl);

         if (!coeffs.probe(key)) {
             keyT up = key.parent();
             //madness::print("sock forwarding to parent",key,up);
             PROFILE_BLOCK(sitome_send);
             woT::task(coeffs.owner(up), &FunctionImpl<T,NDIM>::sock_it_to_me, up, ref, TaskAttributes::hipri());
             return None;
         }

         const nodeT& node = coeffs.find(key).get()->second;
         Future< std::pair<keyT,coeffT> > reply(ref);
         if (node.has_coeff()) {
             //madness::print("sock found it with coeff",key);
             reply.set(std::pair<keyT,coeffT>(key,node.coeff()));
         }
         else {
             //madness::print("sock found it without coeff",key);
             reply.set(std::pair<keyT,coeffT>(key,coeffT()));
         }
         return None;
     }


     // Like sock_it_to_me, but when the node that is found holds no coefficients the
     // reply carries coefficients obtained from project(key) instead of an empty
     // tensor.  The tree itself is not modified.
     template <typename T, std::size_t NDIM>
     Void FunctionImpl<T,NDIM>::sock_it_to_me_too(const keyT& key,
                                                  const RemoteReference< FutureImpl< std::pair<keyT,coeffT> > >& ref) const {
         PROFILE_MEMBER_FUNC(FunctionImpl);

         if (!coeffs.probe(key)) {
             // Node not stored: pass the request on to the owner of the parent key
             keyT up = key.parent();
             PROFILE_BLOCK(sitome2_send);
             woT::task(coeffs.owner(up), &FunctionImpl<T,NDIM>::sock_it_to_me_too, up, ref, TaskAttributes::hipri());
             return None;
         }

         const nodeT& node = coeffs.find(key).get()->second;
         Future< std::pair<keyT,coeffT> > reply(ref);
         if (node.has_coeff()) {
             reply.set(std::pair<keyT,coeffT>(key,node.coeff()));
         }
         else {
             // Build a temporary node around the projected coefficients and send those
             nodeT projected(coeffT(project(key),targs),false);
             reply.set(std::pair<keyT,coeffT>(key,projected.coeff()));
         }
         return None;
     }


     /// Evaluate the function at a point, hopping between processes as required.
     ///
     /// Starting at \c keyin the tree is descended one level at a time towards the
     /// child box containing the point.  As soon as a node with coefficients is found
     /// the future referenced by \c ref is set to the result of eval_cube.  Whenever the
     /// current key is owned by another process the remaining work is shipped there
     /// as a high-priority task.
     /// @param[in] xin    coordinates of the point relative to the box \c keyin (presumably each in [0,1] -- confirm against callers)
     /// @param[in] keyin  box at which to start the descent
     /// @param[in] ref    remote reference to the future that receives the value
     template <typename T, std::size_t NDIM>
     Void FunctionImpl<T,NDIM>::eval(const Vector<double,NDIM>& xin,
                                     const keyT& keyin,
                                     const typename Future<T>::remote_refT& ref) {

         PROFILE_MEMBER_FUNC(FunctionImpl);
         // This is ugly.  We must figure out a clean way to use
         // owner computes rule from the container.
         Vector<double,NDIM> x = xin;
         keyT key = keyin;
         Vector<Translation,NDIM> l = key.translation();
         ProcessID me = world.rank();
         while (1) {
             ProcessID owner = coeffs.owner(key);
             if (owner != me) {
                 PROFILE_BLOCK(eval_send);
                 woT::task(owner, &implT::eval, x, key, ref, TaskAttributes::hipri());
                 return None;
             }
             else {
                 typename dcT::futureT fut = coeffs.find(key);
                 typename dcT::iterator it = fut.get();
                 // A key missing from the container would otherwise be dereferenced
                 // through the end iterator below.
                 MADNESS_ASSERT(it != coeffs.end());
                 nodeT& node = it->second;
                 if (node.has_coeff()) {
                     Future<T>(ref).set(eval_cube(key.level(), x, node.coeff().full_tensor_copy()));
                     return None;
                 }
                 else {
                     // Move to the child box containing the point and rescale the
                     // coordinates to that box.
                     for (std::size_t i=0; i<NDIM; ++i) {
                         double xi = x[i]*2.0;
                         int li = int(xi);
                         if (li == 2) li = 1; // x[i]==1 belongs to the upper child
                         x[i] = xi - li;
                         l[i] = 2*l[i] + li;
                     }
                     key = keyT(key.level()+1,l);
                 }
             }
         }
         //MADNESS_EXCEPTION("should not be here",0);
     }


     /// Evaluate the function at a point using only nodes stored on this process.
     ///
     /// Descends from the root key towards the box containing the point, at most down
     /// to \c maxlevel.  No communication is performed.
     /// @param[in] xin       coordinates of the point relative to the root box
     /// @param[in] maxlevel  deepest level that is examined
     /// @return (true, value) for the first locally owned node with coefficients that
     ///         is met, otherwise (false, 0.0)
     template <typename T, std::size_t NDIM>
     std::pair<bool,T>
     FunctionImpl<T,NDIM>::eval_local_only(const Vector<double,NDIM>& xin, Level maxlevel) {
         Vector<double,NDIM> x = xin;
         keyT key(0);
         Vector<Translation,NDIM> trans = key.translation();
         const ProcessID me = world.rank();

         // The loop increment builds the child key from the translation updated in the body
         for (; key.level() <= maxlevel; key = keyT(key.level()+1,trans)) {
             if (coeffs.owner(key) == me) {
                 typename dcT::futureT fut = coeffs.find(key);
                 typename dcT::iterator it = fut.get();
                 if (it != coeffs.end()) {
                     nodeT& node = it->second;
                     if (node.has_coeff()) {
                         return std::pair<bool,T>(true,eval_cube(key.level(), x, node.coeff().full_tensor_copy()));
                     }
                 }
             }

             // Select the child box containing the point and rescale the coordinates to it
             for (std::size_t d=0; d<NDIM; ++d) {
                 const double doubled = x[d]*2.0;
                 int half = int(doubled);
                 if (half == 2) half = 1;
                 x[d] = doubled - half;
                 trans[d] = 2*trans[d] + half;
             }
         }
         return std::pair<bool,T>(false,0.0);
     }


     /// Find the tree level at which a point is represented, hopping between processes as required.
     ///
     /// Same descent as eval, but the future referenced by \c ref is set to the level
     /// of the first node with coefficients that is met.
     /// @param[in] xin    coordinates of the point relative to the box \c keyin (presumably each in [0,1] -- confirm against callers)
     /// @param[in] keyin  box at which to start the descent
     /// @param[in] ref    remote reference to the future that receives the level
     template <typename T, std::size_t NDIM>
     Void FunctionImpl<T,NDIM>::evaldepthpt(const Vector<double,NDIM>& xin,
                                            const keyT& keyin,
                                            const typename Future<Level>::remote_refT& ref) {

         PROFILE_MEMBER_FUNC(FunctionImpl);
         // This is ugly.  We must figure out a clean way to use
         // owner computes rule from the container.
         Vector<double,NDIM> x = xin;
         keyT key = keyin;
         Vector<Translation,NDIM> l = key.translation();
         ProcessID me = world.rank();
         while (1) {
             ProcessID owner = coeffs.owner(key);
             if (owner != me) {
                 PROFILE_BLOCK(eval_send);
                 woT::task(owner, &implT::evaldepthpt, x, key, ref, TaskAttributes::hipri());
                 return None;
             }
             else {
                 typename dcT::futureT fut = coeffs.find(key);
                 typename dcT::iterator it = fut.get();
                 // A key missing from the container would otherwise be dereferenced
                 // through the end iterator below.
                 MADNESS_ASSERT(it != coeffs.end());
                 nodeT& node = it->second;
                 if (node.has_coeff()) {
                     Future<Level>(ref).set(key.level());
                     return None;
                 }
                 else {
                     // Move to the child box containing the point and rescale the
                     // coordinates to that box.
                     for (std::size_t i=0; i<NDIM; ++i) {
                         double xi = x[i]*2.0;
                         int li = int(xi);
                         if (li == 2) li = 1; // x[i]==1 belongs to the upper child
                         x[i] = xi - li;
                         l[i] = 2*l[i] + li;
                     }
                     key = keyT(key.level()+1,l);
                 }
             }
         }
         //MADNESS_EXCEPTION("should not be here",0);
     }


     /// Find the rank of the coefficients representing a point, hopping between processes as required.
     ///
     /// Same descent as eval, but the future referenced by \c ref is set to
     /// \c coeff().rank() of the first node with coefficients that is met.
     /// @param[in] xin    coordinates of the point relative to the box \c keyin (presumably each in [0,1] -- confirm against callers)
     /// @param[in] keyin  box at which to start the descent
     /// @param[in] ref    remote reference to the future that receives the rank
     template <typename T, std::size_t NDIM>
     Void FunctionImpl<T,NDIM>::evalR(const Vector<double,NDIM>& xin,
                                      const keyT& keyin,
                                      const typename Future<long>::remote_refT& ref) {

         PROFILE_MEMBER_FUNC(FunctionImpl);
         // This is ugly.  We must figure out a clean way to use
         // owner computes rule from the container.
         Vector<double,NDIM> x = xin;
         keyT key = keyin;
         Vector<Translation,NDIM> l = key.translation();
         ProcessID me = world.rank();
         while (1) {
             ProcessID owner = coeffs.owner(key);
             if (owner != me) {
                 PROFILE_BLOCK(eval_send);
                 woT::task(owner, &implT::evalR, x, key, ref, TaskAttributes::hipri());
                 return None;
             }
             else {
                 typename dcT::futureT fut = coeffs.find(key);
                 typename dcT::iterator it = fut.get();
                 // A key missing from the container would otherwise be dereferenced
                 // through the end iterator below.
                 MADNESS_ASSERT(it != coeffs.end());
                 nodeT& node = it->second;
                 if (node.has_coeff()) {
                     Future<long>(ref).set(node.coeff().rank());
                     return None;
                 }
                 else {
                     // Move to the child box containing the point and rescale the
                     // coordinates to that box.
                     for (std::size_t i=0; i<NDIM; ++i) {
                         double xi = x[i]*2.0;
                         int li = int(xi);
                         if (li == 2) li = 1; // x[i]==1 belongs to the upper child
                         x[i] = xi - li;
                         l[i] = 2*l[i] + li;
                     }
                     key = keyT(key.level()+1,l);
                 }
             }
         }
         //MADNESS_EXCEPTION("should not be here",0);
     }


     /// Compute the Frobenius norms of the \c cdata.sh block of \c t and of everything else.
     ///
     /// @param[in]  t   the tensor to analyse (not modified; a copy is used)
     /// @param[out] lo  norm of the block selected by \c cdata.sh
     /// @param[out] hi  norm of the tensor with that block zeroed out
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::tnorm(const tensorT& t, double* lo, double* hi) const {
         PROFILE_MEMBER_FUNC(FunctionImpl);
         // Zeroing the low-order block of a copy looks wasteful, but it is more
         // accurate than summing everything and subtracting off the low-order part
         // (assuming the high-order part is small relative to the low-order part).
         tensorT scratch = copy(t);
         tensorT low_block = scratch(cdata.sh);
         *lo = low_block.normf();
         low_block.fill(0.0);
         *hi = scratch.normf();
     }


     namespace detail {
         /// Binary functor that ignores both arguments; serializes no state.
         template <typename A, typename B>
         struct noop {
             void operator()(const A& a, const B& b) const {}

             template <typename Archive> void serialize(Archive& ar) {}
         };

         /// Functor that scales a tensor, or the coefficients of a node, by a fixed factor.
         template <typename T, std::size_t NDIM>
         struct scaleinplace {
             T q; ///< the scale factor (left uninitialized by the default constructor)
             scaleinplace() {}
             // G++ 4.1.2 ICEs on BGP ... scaleinplace(T q) : q(q) {}
             scaleinplace(T q) {this->q = q;}
             void operator()(const Key<NDIM>& key, Tensor<T>& t) const {
                 t.scale(q);
             }
             void operator()(const Key<NDIM>& key, FunctionNode<T,NDIM>& node) const {
                 node.coeff().scale(q);
             }
             template <typename Archive> void serialize(Archive& ar) {
                 ar & q;
             }
         };

         /// Functor that replaces each element of a tensor by its square.
         template <typename T, std::size_t NDIM>
         struct squareinplace {
             void operator()(const Key<NDIM>& key, Tensor<T>& t) const {
                 t.emul(t);
             }
             template <typename Archive> void serialize(Archive& ar) {}
         };

         /// Functor that replaces a tensor by its element-wise absolute value.
         template <typename T, std::size_t NDIM>
         struct absinplace {
             void operator()(const Key<NDIM>& key, Tensor<T>& t) const {t=abs(t);}
             template <typename Archive> void serialize(Archive& ar) {}
         };

         /// Functor that replaces a tensor by its element-wise absolute value squared.
         template <typename T, std::size_t NDIM>
         struct abssquareinplace {
             void operator()(const Key<NDIM>& key, Tensor<T>& t) const {
                 // The result of abs() must be kept: previously it was discarded, which
                 // left t*t in the tensor instead of |t|^2.
                 t = abs(t);
                 t.emul(t);
             }
             template <typename Archive> void serialize(Archive& ar) {}
         };
     }


     /// Multiply the coefficients of every node by \c q, in place.
     /// @param[in] q      the scale factor
     /// @param[in] fence  forwarded to unary_op_node_inplace
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::scale_inplace(const T q, bool fence) {
         //        unary_op_coeff_inplace(detail::scaleinplace<T,NDIM>(q), fence);
         const detail::scaleinplace<T,NDIM> scaler(q);
         unary_op_node_inplace(scaler, fence);
     }


     /// Square the function values in place via unary_op_value_inplace.
     /// @param[in] fence  forwarded to unary_op_value_inplace
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::square_inplace(bool fence) {
         //unary_op_value_inplace(&implT::autorefine_square_test, detail::squareinplace<T,NDIM>(), fence);
         const detail::squareinplace<T,NDIM> squarer = detail::squareinplace<T,NDIM>();
         unary_op_value_inplace(squarer, fence);
     }


     /// Replace the function values by their absolute value, in place.
     /// @param[in] fence  forwarded to unary_op_value_inplace
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::abs_inplace(bool fence) {
         const detail::absinplace<T,NDIM> absolute = detail::absinplace<T,NDIM>();
         unary_op_value_inplace(absolute, fence);
     }


     /// Apply detail::abssquareinplace to the function values, in place.
     /// @param[in] fence  forwarded to unary_op_value_inplace
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::abs_square_inplace(bool fence) {
         const detail::abssquareinplace<T,NDIM> abs_squarer = detail::abssquareinplace<T,NDIM>();
         unary_op_value_inplace(abs_squarer, fence);
     }


     /// Tabulate the scaling functions of a parent box at the quadrature points of a child box (one dimension).
     ///
     /// @param[in]  np   level of the parent box
     /// @param[in]  lp   translation of the parent box
     /// @param[in]  nc   level of the child box
     /// @param[in]  lc   translation of the child box
     /// @param[out] phi  phi(i,mu) receives function i at quadrature point mu, scaled by 2^(np/2)
     template <typename T, std::size_t NDIM>
     void FunctionImpl<T,NDIM>::phi_for_mul(Level np, Translation lp, Level nc, Translation lc, Tensor<double>& phi) const {
         PROFILE_MEMBER_FUNC(FunctionImpl);
         double basis_values[200];  // fixed-size scratch filled by legendre_scaling_functions
         const double level_ratio = pow(2.0,double(np-nc));

         for (int mu=0; mu<cdata.npt; ++mu) {
             // Child quadrature point expressed in the coordinates of the parent box
             const double xmu = level_ratio*(cdata.quad_x(mu)+lc) - lp;
             MADNESS_ASSERT(xmu>-1e-15 && xmu<(1+1e-15));
             legendre_scaling_functions(xmu,cdata.k,basis_values);
             for (int fn=0; fn<k; ++fn) {
                 phi(fn,mu) = basis_values[fn];
             }
         }
         phi.scale(pow(2.0,0.5*np));
     }


     /// Express the coefficients \c s of the box \c parent in the box \c child.
     ///
     /// @param[in] s       coefficients belonging to \c parent
     /// @param[in] parent  key of the box \c s belongs to
     /// @param[in] child   key of the box the coefficients are wanted in
     /// @return \c s unchanged if the keys are equal or either one is invalid, otherwise the converted coefficients
     template <typename T, std::size_t NDIM>
     const GenTensor<T> FunctionImpl<T,NDIM>::parent_to_child(const coeffT& s, const keyT& parent, const keyT& child) const {
         PROFILE_MEMBER_FUNC(FunctionImpl);

         // An invalid parent/child means that they are out of the box
         // and it is the responsibility of the caller to worry about that
         // ... most likely the coefficients (s) are zero to reflect
         // zero B.C. so returning s makes handling this easy.
         const bool nothing_to_do = (parent == child || parent.is_invalid() || child.is_invalid());
         if (nothing_to_do) return s;

         // Values in the child box, weighted by sqrt(volume of the child box),
         // then transformed with quad_phiw.
         coeffT in_child = fcube_for_mul<T>(child, parent, s);
         const double child_scale = sqrt(FunctionDefaults<NDIM>::get_cell_volume()*pow(0.5,double(NDIM*child.level())));
         in_child.scale(child_scale);
         in_child = transform(in_child,cdata.quad_phiw);

         return in_child;
     }


     /// Return the contribution of the locally stored nodes to the trace of the function.
     ///
     /// In compressed form only the first coefficient of the root node contributes,
     /// and only on the process owning the root.  Otherwise the first coefficient of
     /// every local node with coefficients is accumulated with weight 2^(-NDIM*level/2).
     /// The total is multiplied by sqrt(cell volume).
     template <typename T, std::size_t NDIM>
     T FunctionImpl<T,NDIM>::trace_local() const {
         PROFILE_MEMBER_FUNC(FunctionImpl);
         std::vector<long> origin(NDIM,0);  // index of the first coefficient
         T total = 0.0;

         if (!compressed) {
             for (typename dcT::const_iterator it=coeffs.begin(); it!=coeffs.end(); ++it) {
                 const nodeT& node = it->second;
                 if (!node.has_coeff()) continue;
                 const keyT& key = it->first;
                 total += node.coeff().full_tensor_copy()(origin)*pow(0.5,NDIM*key.level()*0.5);
             }
         }
         else if (world.rank() == coeffs.owner(cdata.key0)) {
             typename dcT::const_iterator root = coeffs.find(cdata.key0).get();
             if (root != coeffs.end()) {
                 const nodeT& node = root->second;
                 if (node.has_coeff()) total = node.coeff().full_tensor_copy()(origin);
             }
         }
         return total*sqrt(FunctionDefaults<NDIM>::get_cell_volume());
     }


     static inline bool enforce_bc(bool is_periodic, Level n, Translation& l) {

         Translation two2n = 1ul << n;

         if (l < 0) {

             if (is_periodic)

                 l += two2n; // Periodic BC

             else

                 return false; // Zero BC

         }

         else if (l >= two2n) {

             if (is_periodic)

                 l -= two2n; // Periodic BC

             else

                 return false; // Zero BC

         }

         return true;

     }


     /// Return the key displaced from \c key by \c disp at the same level, subject to the boundary conditions.
     ///
     /// @param[in] key          the starting box
     /// @param[in] disp         displacement; only its translation is used
     /// @param[in] is_periodic  per-axis flag handed to enforce_bc
     /// @return the neighbouring key, or keyT::invalid() if enforce_bc rejects any axis
     template <typename T, std::size_t NDIM>
     Key<NDIM> FunctionImpl<T,NDIM>::neighbor(const keyT& key, const Key<NDIM>& disp, const std::vector<bool>& is_periodic) const {
         Vector<Translation,NDIM> shifted = key.translation();
         const Level n = key.level();

         for (std::size_t axis=0; axis<NDIM; ++axis) {
             shifted[axis] += disp.translation()[axis];

             //if (!enforce_bc(bc(axis,0), bc(axis,1), n, shifted[axis])) {
             const bool inside = enforce_bc(is_periodic[axis], n, shifted[axis]);
             if (!inside) return keyT::invalid();
         }
         return keyT(n,shifted);
     }


     /// Request the (key, coefficients) pair for \c key from its owner.
     ///
     /// Submits a high-priority sock_it_to_me_too task to the owner of \c key; that task
     /// fills the returned future.
     /// @param[in] key  the node being asked for
     /// @return future of the pair delivered by sock_it_to_me_too
     template <typename T, std::size_t NDIM>
     Future< std::pair< Key<NDIM>, GenTensor<T> > >
     FunctionImpl<T,NDIM>::find_me(const Key<NDIM>& key) const {
         PROFILE_MEMBER_FUNC(FunctionImpl);
         typedef std::pair< Key<NDIM>,coeffT > argT;
         Future<argT> reply;
         PROFILE_BLOCK(find_me_send);
         const ProcessID dest = coeffs.owner(key);
         woT::task(dest, &implT::sock_it_to_me_too, key, reply.remote_ref(world), TaskAttributes::hipri());
         return reply;
     }


     /// Recursive driver of the compression: spawn work for the children, then combine.
     ///
     /// For a node with children one compress_spawn task per child is launched and
     /// the resulting futures are handed to make_redundant_op (if \c redundant) or to
     /// compress_op on this process.  For a leaf its coefficients are returned, and
     /// removed from the node unless \c keepleaves is set.
     /// @param[in] key          the node to process; it must exist
     /// @param[in] nonstandard  forwarded to the children and to compress_op
     /// @param[in] keepleaves   if true, leaves keep their coefficients
     /// @param[in] redundant    selects make_redundant_op instead of compress_op
     /// @return future of the coefficients produced for this node
     template <typename T, std::size_t NDIM>
     Future< GenTensor<T> > FunctionImpl<T,NDIM>::compress_spawn(const Key<NDIM>& key,
                                                                 bool nonstandard, bool keepleaves, bool redundant) {
         if (!coeffs.probe(key)) print("missing node",key);
         MADNESS_ASSERT(coeffs.probe(key));

         // get fetches remote data (here actually local)
         nodeT& node = coeffs.find(key).get()->second;

         if (!node.has_children()) {
             // Leaf: capture the coefficients before they are possibly cleared
             Future<coeffT > leaf_coeff(node.coeff());
             if (!keepleaves) node.clear_coeff();
             return leaf_coeff;
         }

         std::vector< Future<coeffT > > child_coeffs = future_vector_factory<coeffT >(1<<NDIM);
         int slot=0;
         for (KeyChildIterator<NDIM> child(key); child; ++child,++slot) {
             PROFILE_BLOCK(compress_send);
             // readily available
             child_coeffs[slot] = woT::task(coeffs.owner(child.key()), &implT::compress_spawn, child.key(),
                                            nonstandard, keepleaves, redundant, TaskAttributes::hipri());
         }

         if (redundant) return woT::task(world.rank(),&implT::make_redundant_op, key, child_coeffs);
         return woT::task(world.rank(),&implT::compress_op, key, child_coeffs, nonstandard, redundant);
     }


     /// Fill in the plot-grid points that fall inside the box \c key.
     ///
     /// The plot grid has npt[d] equally spaced points from plotlo[d] to plothi[d] in
     /// each dimension.  Every grid point lying inside the box is assigned either the
     /// level of the box (\c eval_refine true) or the value returned by eval_cube.
     /// @param[in,out] ptr          pointer to the tensor holding the plot grid
     /// @param[in]     key          the box to process; its node is looked up in \c coeffs
     /// @param[in]     plotlo       lower corner of the plot region
     /// @param[in]     plothi       upper corner of the plot region
     /// @param[in]     npt          number of plot points per dimension
     /// @param[in]     eval_refine  if true store the level instead of the function value
     template <typename T, std::size_t NDIM>

     Void FunctionImpl<T,NDIM>::plot_cube_kernel(archive::archive_ptr< Tensor<T> > ptr,

                                                 const keyT& key,

                                                 const coordT& plotlo, const coordT& plothi, const std::vector<long>& npt,

                                                 bool eval_refine) const {


         Tensor<T>& r = *ptr;


         coordT h; // Increment between points in each dimension

         for (std::size_t i=0; i<NDIM; ++i) {

             if (npt[i] > 1) {

                 h[i] = (plothi[i]-plotlo[i])/(npt[i]-1);

             }

             else {

                 // A single point in this dimension requires a degenerate plot range

                 MADNESS_ASSERT(plotlo[i] == plothi[i]);

                 h[i] = 0.0;

             }

         }


         const Level n = key.level();

         const Vector<Translation,NDIM>& l = key.translation();

         const double twon = pow(2.0,double(n));

         // The temporary full tensor copy is kept alive by binding it to a const reference

         const tensorT& coeff = coeffs.find(key).get()->second.coeff().full_tensor_copy(); // Ugh!

         //        const tensorT coeff = coeffs.find(key).get()->second.full_tensor_copy(); // Ugh!

         long ind[NDIM];

         coordT x;


         // Extent of the box (boxlo, boxhi) and number of plot points inside it (boxnpt)

         coordT boxlo, boxhi;

         Vector<int,NDIM> boxnpt;

         double fac = pow(0.5,double(key.level()));

         int npttotal = 1;

         for (std::size_t d=0; d<NDIM; ++d) {

             // Coords of box

             boxlo[d] = fac*key.translation()[d];

             boxhi[d] = boxlo[d]+fac;


             if (boxlo[d] > plothi[d] || boxhi[d] < plotlo[d]) {

                 // Discard boxes out of the plot range

                 npttotal = boxnpt[d] = 0;

                 //print("OO range?");

                 break;

             }

             else if (npt[d] == 1) {

                 // This dimension is only a single point

                 boxlo[d] = boxhi[d] = plotlo[d];

                 boxnpt[d] = 1;

             }

             else {

                 // Restrict to plot range

                 boxlo[d] = std::max(boxlo[d],plotlo[d]);

                 boxhi[d] = std::min(boxhi[d],plothi[d]);


                 // Round lo up to next plot point; round hi down

                 double xlo = long((boxlo[d]-plotlo[d])/h[d])*h[d] + plotlo[d];

                 if (xlo < boxlo[d]) xlo += h[d];

                 boxlo[d] =  xlo;

                 double xhi = long((boxhi[d]-plotlo[d])/h[d])*h[d] + plotlo[d];

                 if (xhi > boxhi[d]) xhi -= h[d];

                 // MADNESS_ASSERT(xhi >= xlo);  // nope

                 boxhi[d] = xhi;

                 // NOTE(review): the assert above is disabled, so xhi < xlo apparently can occur and this count can then be <= 0 -- confirm

                 boxnpt[d] = long(round((boxhi[d] - boxlo[d])/h[d])) + 1;

             }

             npttotal *= boxnpt[d];

         }

         //print("    box", boxlo, boxhi, boxnpt, npttotal);

         // Visit every plot point inside the box; skipped when the box holds none

         if (npttotal > 0) {

             for (IndexIterator it(boxnpt); it; ++it) {

                 for (std::size_t d=0; d<NDIM; ++d) {

                     double xd = boxlo[d] + it[d]*h[d]; // Sim. coords of point

                     x[d] = twon*xd - l[d]; // Offset within box

                     MADNESS_ASSERT(x[d]>=0.0 && x[d] <=1.0);  // sanity

                     if (npt[d] > 1) {

                         ind[d] = long(round((xd-plotlo[d])/h[d])); // Index of plot point

                     }

                     else {

                         ind[d] = 0;

                     }

                     MADNESS_ASSERT(ind[d]>=0 && ind[d]<npt[d]); // sanity

                 }

                 if (eval_refine) {

                     // Record the level of the box instead of the function value

                     r(ind) = n;

                 }

                 else {

                     T tmp = eval_cube(n, x, coeff);

                     r(ind) = tmp;

                     //print("    eval", ind, tmp, r(ind));

                 }

             }

         }


         return None;

     }


     /// Evaluate the function on a regular grid of plot points.
     ///
     /// One plot_cube_kernel task is submitted on this process for every local node
     /// with coefficients; the results are then summed over all processes.
     /// The function must not be in compressed form.
     /// @param[in] plotlo       lower corner of the plot region
     /// @param[in] plothi       upper corner of the plot region
     /// @param[in] npt          number of plot points per dimension
     /// @param[in] eval_refine  forwarded to plot_cube_kernel
     /// @return tensor of dimensions \c npt holding the summed results
     template <typename T, std::size_t NDIM>
     Tensor<T> FunctionImpl<T,NDIM>::eval_plot_cube(const coordT& plotlo,
                                                    const coordT& plothi,
                                                    const std::vector<long>& npt,
                                                    const bool eval_refine) const {
         PROFILE_MEMBER_FUNC(FunctionImpl);
         Tensor<T> grid(NDIM, &npt[0]);
         //grid(___) = 99.0;
         MADNESS_ASSERT(!compressed);

         const ProcessID me = world.rank();
         for (typename dcT::const_iterator it=coeffs.begin(); it!=coeffs.end(); ++it) {
             if (!it->second.has_coeff()) continue;
             woT::task(me, &implT::plot_cube_kernel,
                       archive::archive_ptr< Tensor<T> >(&grid), it->first, plotlo, plothi, npt, eval_refine);
         }

         //        ITERATOR(grid, if (grid(IND) == 99.0) {print("BAD", IND); error("bad",0);});

         // Wait for the local kernels, then combine the contributions of all processes
         world.taskq.fence();
         world.gop.sum(grid.ptr(), grid.size());
         world.gop.fence();

         return grid;
     }


     /// Write one real value to \c f in "%.6e" format followed by a newline.
     static inline void dxprintvalue(FILE* f, const double t) {
         const double value = t;
         fprintf(f,"%.6e\n",value);
     }


     /// Write one complex value to \c f as "real imag", each in "%.6e" format, followed by a newline.
     static inline void dxprintvalue(FILE* f, const double_complex& t) {
         const double re = t.real();
         const double im = t.imag();
         fprintf(f,"%.6e %.6e\n", re, im);
     }


     // Writes an OpenDX format file with a cube/slice of points on a uniform grid.
     //
     // All processes must call this routine: every process takes part in the
     // global fences and in function.eval_cube().  Only rank 0 opens, writes
     // and closes the file.
     //
     //   function  the function to sample (verify() is called on it)
     //   filename  path of the output file; also used as the name of the
     //             final "field" object written to the file
     //   cell      plot region; cell(d,0) is the origin and cell(d,1) the far
     //             edge in dimension d
     //   npt       number of grid points in each dimension
     //   binary    if true the values are dumped with fwrite, otherwise one
     //             value per line is printed as text
     //
     // Rank 0 raises a MADNESS_EXCEPTION if the file cannot be opened.
     template <typename T, std::size_t NDIM>
     void plotdx(const Function<T,NDIM>& function,
                 const char* filename,
                 const Tensor<double>& cell,
                 const std::vector<long>& npt,
                 bool binary) {
         PROFILE_FUNC;
         MADNESS_ASSERT(NDIM<=6);
         // Connection element type written to the header, indexed by NDIM-1
         const char* element[6] = {"lines","quads","cubes","cubes4D","cubes5D","cubes6D"};

         function.verify();
         World& world = const_cast< Function<T,NDIM>& >(function).world();
         FILE *f=0;
         if (world.rank() == 0) {
             f = fopen(filename, "w");
             if (!f) MADNESS_EXCEPTION("plotdx: failed to open the plot file", 0);

             // Object 1: grid positions (counts, origin and one delta vector per dimension)
             fprintf(f,"object 1 class gridpositions counts ");
             for (std::size_t d=0; d<NDIM; ++d) fprintf(f," %ld",npt[d]);
             fprintf(f,"\n");

             fprintf(f,"origin ");
             for (std::size_t d=0; d<NDIM; ++d) fprintf(f, " %.6e", cell(d,0));
             fprintf(f,"\n");

             for (std::size_t d=0; d<NDIM; ++d) {
                 fprintf(f,"delta ");
                 for (std::size_t c=0; c<d; ++c) fprintf(f, " 0");
                 // Grid spacing; stays zero when the dimension has a single point
                 double h = 0.0;
                 if (npt[d]>1) h = (cell(d,1)-cell(d,0))/(npt[d]-1);
                 fprintf(f," %.6e", h);
                 for (std::size_t c=d+1; c<NDIM; ++c) fprintf(f, " 0");
                 fprintf(f,"\n");
             }
             fprintf(f,"\n");

             // Object 2: grid connections
             fprintf(f,"object 2 class gridconnections counts ");
             for (std::size_t d=0; d<NDIM; ++d) fprintf(f," %ld",npt[d]);
             fprintf(f,"\n");
             fprintf(f, "attribute \"element type\" string \"%s\"\n", element[NDIM-1]);
             fprintf(f, "attribute \"ref\" string \"positions\"\n");
             fprintf(f,"\n");

             // Object 3: header of the data array.  The total number of points
             // is accumulated in long (the element type of npt) instead of int
             // so that the product is neither narrowed nor overflows int on
             // large grids.
             long npoint = 1;
             for (std::size_t d=0; d<NDIM; ++d) npoint *= npt[d];
             const char* iscomplex = "";
             if (TensorTypeData<T>::iscomplex) iscomplex = "category complex";
             const char* isbinary = "";
             if (binary) isbinary = "binary";
             fprintf(f,"object 3 class array type double %s rank 0 items %ld %s data follows\n",
                     iscomplex, npoint, isbinary);
         }

         world.gop.fence();
         Tensor<T> r = function.eval_cube(cell, npt);

         if (world.rank() == 0) {
             if (binary) {
                 // This assumes that the values are double precision: the header
                 // above declares "type double" while sizeof(T) bytes are written
                 // per value.
                 fflush(f);
                 fwrite((void *) r.ptr(), sizeof(T), r.size(), f);
                 fflush(f);
             }
             else {
                 // Text mode: one value per line (two numbers per line if complex)
                 for (IndexIterator it(npt); it; ++it) {
                     dxprintvalue(f,r(*it));
                 }
             }
             fprintf(f,"\n");

             // Trailer: tie positions, connections and data together in a field
             fprintf(f,"object \"%s\" class field\n",filename);
             fprintf(f,"component \"positions\" value 1\n");
             fprintf(f,"component \"connections\" value 2\n");
             fprintf(f,"component \"data\" value 3\n");
             fprintf(f,"\nend\n");
             fclose(f);
         }
         world.gop.fence();
     }


     // Assigns the built-in default value to every FunctionDefaults<NDIM> static:
     // k=6, thresh=1e-4, free boundary conditions, full tensor representation,
     // the unit cube [0,1] in every dimension as the user cell, and a LevelPmap
     // built on the given world as the default process map.
     template <std::size_t NDIM>
     void FunctionDefaults<NDIM>::set_defaults(World& world) {
         typedef WorldDCPmapInterface< Key<NDIM> > pmap_interfaceT;

         // Numerical parameters
         k = 6;
         thresh = 1e-4;
         initial_level = 2;
         max_refine_level = 30;
         truncate_mode = 0;

         // Behaviour switches
         refine = true;
         autorefine = true;
         truncate_on_project = true;
         debug = false;
         apply_randomize = false;
         project_randomize = false;

         // Boundary conditions and coefficient representation
         bc = BoundaryConditions<NDIM>(BC_FREE);
         tt = TT_FULL;

         // User cell: column 1 is set to 1.0 in every dimension, then the
         // derived cell quantities are refreshed
         cell = Tensor<double>(NDIM,2);
         cell(_,1) = 1.0;
         recompute_cell_info();

         // Default process map.  WorldDCDefaultPmap and SimplePmap are the
         // alternatives that have been tried here.
         pmap = std::shared_ptr<pmap_interfaceT>(new madness::LevelPmap< Key<NDIM> >(world));
     }


     // Definition of the static table of MAXK pointers to FunctionCommonData.
     // The empty initializer leaves every entry a null pointer.
     template <typename T, std::size_t NDIM>
     const FunctionCommonData<T,NDIM>* FunctionCommonData<T,NDIM>::data[MAXK] = {};


     // Out-of-class definitions of the static data members of FunctionDefaults<NDIM>.
     // No initializers are given here; set_defaults() assigns k, thresh, the level
     // limits, the flags, bc, tt, cell and pmap.
     template <std::size_t NDIM> int FunctionDefaults<NDIM>::k;

     template <std::size_t NDIM> double FunctionDefaults<NDIM>::thresh;

     template <std::size_t NDIM> int FunctionDefaults<NDIM>::initial_level;

     template <std::size_t NDIM> int FunctionDefaults<NDIM>::max_refine_level;

     template <std::size_t NDIM> int FunctionDefaults<NDIM>::truncate_mode;

     template <std::size_t NDIM> bool FunctionDefaults<NDIM>::refine;

     template <std::size_t NDIM> bool FunctionDefaults<NDIM>::autorefine;

     template <std::size_t NDIM> bool FunctionDefaults<NDIM>::debug;

     template <std::size_t NDIM> bool FunctionDefaults<NDIM>::truncate_on_project;

     template <std::size_t NDIM> bool FunctionDefaults<NDIM>::apply_randomize;

     template <std::size_t NDIM> bool FunctionDefaults<NDIM>::project_randomize;

     template <std::size_t NDIM> BoundaryConditions<NDIM> FunctionDefaults<NDIM>::bc;

     template <std::size_t NDIM> TensorType FunctionDefaults<NDIM>::tt;

     template <std::size_t NDIM> Tensor<double> FunctionDefaults<NDIM>::cell;

     // NOTE(review): the four cell-derived members below are not assigned directly
     // in set_defaults(); presumably recompute_cell_info() fills them -- confirm.
     template <std::size_t NDIM> Tensor<double> FunctionDefaults<NDIM>::cell_width;

     template <std::size_t NDIM> Tensor<double> FunctionDefaults<NDIM>::rcell_width;

     template <std::size_t NDIM> double FunctionDefaults<NDIM>::cell_volume;

     template <std::size_t NDIM> double FunctionDefaults<NDIM>::cell_min_width;

     template <std::size_t NDIM> std::shared_ptr< WorldDCPmapInterface< Key<NDIM> > > FunctionDefaults<NDIM>::pmap;


     // Out-of-class definitions of the static data members of Displacements<NDIM>:
     // one vector of keys, and an array of 64 vectors of keys.
     // NOTE(review): the array bound 64 must match the in-class declaration -- confirm
     // against displacements.h.
     template <std::size_t NDIM> std::vector< Key<NDIM> > Displacements<NDIM>::disp;

     template <std::size_t NDIM> std::vector< Key<NDIM> > Displacements<NDIM>::disp_periodicsum[64];


 }


 #endif // MADNESS_MRA_MRAIMPL_H__INCLUDED

np
int np
Definition: tdse1d.cc:166

madness::FunctionNode::is_leaf
bool is_leaf() const
Returns true if this does not have children.
Definition: funcimpl.h:202

thresh
const double thresh
Definition: dielectric.cc:185

madness::error
void error(const char *msg)
Definition: world.cc:128

madness::World::gop
WorldGopInterface & gop
Global operations.
Definition: worldfwd.h:462

madness::GenTensor::config
SRConf< T > config() const
Definition: gentensor.h:201

madness::detail::noop::operator()
void operator()(const A &a, const B &b) const
Definition: mraimpl.h:2902

ttt
double ttt
Definition: eigen_solver.cc:182

B
Tensor< double > B
Definition: tdse1d.cc:167

madness::FunctionImpl::sum_down_spawn
Void sum_down_spawn(const keyT &key, const coeffT &s)
is this the same as trickle_down() ?
Definition: mraimpl.h:964

madness::tr1::shptr::shared_ptr
Definition: shared_ptr_bits.h:38

madness::FunctionNode::size
size_t size() const
Returns the number of coefficients in this node.
Definition: funcimpl.h:231

madness::WorldContainer< keyT, nodeT >

madness::reconstruct
void reconstruct(World &world, const std::vector< Function< T, NDIM > > &v, bool fence=true)
Reconstruct a vector of functions.
Definition: vmra.h:149

madness::g
NDIM const Function< R, NDIM > & g
Definition: mra.h:2179

madness::FunctionNode::set_coeff
void set_coeff(const coeffT &coeffs)
Takes a shallow copy of the coeff — same as this->coeff()=coeff.
Definition: funcimpl.h:274

madness::FunctionImpl::sock_it_to_me_too
Void sock_it_to_me_too(const keyT &key, const RemoteReference< FutureImpl< std::pair< keyT, coeffT > > > &ref) const
Definition: mraimpl.h:2704

madness::norm
T norm(Vector< T, N > v)
Compute norm of a Vector.
Definition: array.h:447

madness::FunctionCommonData::_init_quadrature
static void _init_quadrature(int k, int npt, Tensor< double > &quad_x, Tensor< double > &quad_w, Tensor< double > &quad_phi, Tensor< double > &quad_phiw, Tensor< double > &quad_phit)
Initialize the quadrature information.
Definition: mraimpl.h:83

madness::DerivativeBase::find_neighbor
Future< argT > find_neighbor(const implT *f, const Key< NDIM > &key, int step) const
Definition: derivative.h:250

double_complex
std::complex< double > double_complex
Definition: lineplot.cc:16

madness::LevelPmap
A pmap that locates children on odd levels with their even level parents.
Definition: funcimpl.h:104

madness::GenTensor::full_tensor_copy
GenTensor< T > full_tensor_copy() const
Definition: gentensor.h:184

madness::FunctionImpl::get_thresh
double get_thresh() const
Definition: mraimpl.h:281

madness::FunctionImpl::print_plane
void print_plane(const std::string filename, const int xaxis, const int yaxis, const coordT &el2)
Print a plane ("xy", "xz", or "yz") containing the point x to file.
Definition: mraimpl.h:357

madness::FunctionImpl::do_print_tree
void do_print_tree(const keyT &key, std::ostream &os, Level maxlevel) const
Definition: mraimpl.h:2592

madness::TaskAttributes::hipri
static TaskAttributes hipri()
Definition: worldthread.h:277

madness::FunctionDefaults
FunctionDefaults holds default parameters as static class members.
Definition: funcdefaults.h:175

madness::FunctionImpl::compress_op
coeffT compress_op(const keyT &key, const std::vector< Future< coeffT > > &v, bool nonstandard, bool redundant)
calculate the wavelet coefficients using the sum coefficients of all child nodes
Definition: mraimpl.h:1650

madness::FunctionImpl::plot_cube_kernel
Void plot_cube_kernel(archive::archive_ptr< Tensor< T > > ptr, const keyT &key, const coordT &plotlo, const coordT &plothi, const std::vector< long > &npt, bool eval_refine) const
Definition: mraimpl.h:3097

madness::FunctionImpl::multiply
Void multiply(const implT *f, const FunctionImpl< T, LDIM > *g, const int particle)
multiply f (a pair function of NDIM) with an orbital g (LDIM=NDIM/2)
Definition: funcimpl.h:3018

madness::TensorType
TensorType
low rank representations of tensors (see gentensor.h)
Definition: tensor.h:275

madness::FunctionImpl::insert_zero_down_to_initial_level
void insert_zero_down_to_initial_level(const keyT &key)
Initialize nodes to zero function at initial_level of refinement.
Definition: mraimpl.h:2488

madness::FunctionDefaults::get_cell_min_width
static double get_cell_min_width()
Returns the minimum width of any user cell dimension.
Definition: funcdefaults.h:401

madness::FunctionNode::has_children
bool has_children() const
Returns true if this node has children.
Definition: funcimpl.h:196

madness::FunctionImpl::size
std::size_t size() const
Returns the number of coefficients in the function ... collective global sum.
Definition: mraimpl.h:1829

madness::Key::translation
const Vector< Translation, NDIM > & translation() const
Definition: key.h:225

madness::FunctionImpl::abs_inplace
void abs_inplace(bool fence)
Definition: mraimpl.h:2958

madness::Hash_private::HashAccessor
Definition: worldhashmap.h:332

NDIM
const int NDIM
Definition: tdse1.cc:44

mpfr::mpreal::sum
friend const mpreal sum(const mpreal tab[], unsigned long int n, mp_rnd_t rnd_mode=mpreal::default_rnd)
Definition: mpreal.cc:241

function_common_data.h

madness::FunctionImpl::do_err_box
Definition: funcimpl.h:4544

madness::Vector< double, NDIM >

madness::GenTensor::has_no_data
bool has_no_data() const
Definition: gentensor.h:188

debug
const bool debug
Definition: tdse1.cc:45

madness::FunctionImpl::square_inplace
void square_inplace(bool fence)
Pointwise squaring of function with optional global fence.
Definition: mraimpl.h:2952

mpfr::dim
const mpreal dim(const mpreal &a, const mpreal &b, mp_rnd_t rnd_mode)
Definition: mpreal.h:2201

madness::FunctionNode::coeff
coeffT & coeff()
Returns a non-const reference to the tensor containing the coeffs.
Definition: funcimpl.h:216

madness::FunctionDefaults::set_defaults
static void set_defaults(World &world)
Used to set defaults to k=6, thresh=1e-4, for a unit cube [0,1].
Definition: mraimpl.h:3309

madness::FunctionImpl::parent_to_child_NS
coeffT parent_to_child_NS(const keyT &child, const keyT &parent, const coeffT &coeff) const
Directly project parent NS coeffs to child NS coeffs.
Definition: mraimpl.h:658

madness::FunctionImpl::is_compressed
bool is_compressed() const
Returns true if the function is compressed.
Definition: mraimpl.h:231

L
const double L
Definition: 3dharmonic.cc:123

madness::FunctionImpl::phi_for_mul
void phi_for_mul(Level np, Translation lp, Level nc, Translation lc, Tensor< double > &phi) const
Compute the Legendre scaling functions for multiplication.
Definition: mraimpl.h:2968

madness::FunctionImpl::max_nodes
std::size_t max_nodes() const
Returns the max number of nodes on a processor.
Definition: mraimpl.h:1802

madness::ref
detail::ReferenceWrapper< T > const ref(T &t)
Reference wrapper factory function.
Definition: ref.h:132

madness::plotdx
void plotdx(const Function< T, NDIM > &f, const char *filename, const Tensor< double > &cell=FunctionDefaults< NDIM >::get_cell(), const std::vector< long > &npt=std::vector< long >(NDIM, 201L), bool binary=true)
Writes an OpenDX format file with a cube/slice of points on a uniform grid.
Definition: mraimpl.h:3228

madness::detail::squareinplace
Definition: mraimpl.h:2925

madness::FunctionImpl::max_depth
std::size_t max_depth() const
Returns the maximum depth of the tree ... collective ... global sum/broadcast.
Definition: mraimpl.h:1794

testing::internal::string
::std::string string
Definition: gtest-port.h:872

madness::FunctionImpl::remove_internal_coeffs
Definition: funcimpl.h:1948

madness::detail::scaleinplace::operator()
void operator()(const Key< NDIM > &key, FunctionNode< T, NDIM > &node) const
Definition: mraimpl.h:2916

madness::WorldContainerIterator
Iterator for distributed container wraps the local iterator.
Definition: worlddc.h:159

madness::FunctionImpl::abs_square_inplace
void abs_square_inplace(bool fence)
Definition: mraimpl.h:2963

madness::detail::abssquareinplace::operator()
void operator()(const Key< NDIM > &key, Tensor< T > &t) const
Definition: mraimpl.h:2940

madness::DerivativeBase::do_diff1
Void do_diff1(const implT *f, implT *df, const keyT &key, const argT &left, const argT &center, const argT &right) const
Definition: derivative.h:146

madness::FunctionImpl::do_diff1
Void do_diff1(const DerivativeBase< T, NDIM > *D, const implT *f, const keyT &key, const std::pair< keyT, coeffT > &left, const std::pair< keyT, coeffT > &center, const std::pair< keyT, coeffT > &right)
Definition: mraimpl.h:1023

madness::FunctionImpl::compress
void compress(bool nonstandard, bool keepleaves, bool redundant, bool fence)
compress the wave function
Definition: mraimpl.h:1462

madness::FunctionNode::has_coeff
bool has_coeff() const
Returns true if there are coefficients in this node.
Definition: funcimpl.h:188

madness::FunctionImpl::downsample
tensorT downsample(const keyT &key, const std::vector< Future< coeffT > > &v) const
downsample the sum coefficients of level n+1 to sum coeffs on level n
Definition: mraimpl.h:1237

madness::FunctionImpl::set_functor
void set_functor(const std::shared_ptr< FunctionFunctorInterface< T, NDIM > > functor1)
Definition: mraimpl.h:245

madness::FunctionImpl::truncate_reconstructed_op
coeffT truncate_reconstructed_op(const keyT &key, const std::vector< Future< coeffT > > &v, const double tol)
given the sum coefficients of all children, truncate or not
Definition: mraimpl.h:1584

madness::FunctionImpl::add_scalar_inplace
void add_scalar_inplace(T t, bool fence)
Adds a constant to the function. Local operation, optional fence.
Definition: mraimpl.h:2447

madness::FunctionImpl::norm_tree_op
double norm_tree_op(const keyT &key, const std::vector< Future< double > > &v)
Definition: mraimpl.h:1522

madness::nonstandard
void nonstandard(World &world, std::vector< Function< T, NDIM > > &v, bool fence=true)
Generates non-standard form of a vector of functions.
Definition: vmra.h:167

madness::FunctionImpl::real_size
std::size_t real_size() const
Returns the number of coefficients in the function ... collective global sum.
Definition: mraimpl.h:1860

madness::FunctionImpl::get_norm_tree_recursive
Future< double > get_norm_tree_recursive(const keyT &key) const
Definition: mraimpl.h:2667

madness::FunctionImpl::local_leaf_keys
std::vector< keyT > local_leaf_keys() const
return the keys of the local leaf boxes
Definition: mraimpl.h:515

madness::insert_op
Definition: funcimpl.h:684

madness::legendre_scaling_functions
void legendre_scaling_functions(double x, long k, double *p)
Evaluate the first k Legendre scaling functions.
Definition: legendre.cc:90

madness::detail::abssquareinplace
Definition: mraimpl.h:2939

madness::FunctionImpl::trickle_down
void trickle_down(bool fence)
sum all the contributions from all scales after applying an operator in mod-NS form ...
Definition: mraimpl.h:1388

madness::f
NDIM & f
Definition: mra.h:2179

madness::BaseTensor::dim
long dim(int i) const
Returns the size of dimension i.
Definition: basetensor.h:147

madness::FunctionImpl::min_nodes
std::size_t min_nodes() const
Returns the min number of nodes on a processor.
Definition: mraimpl.h:1811

madness::GenTensor::has_data
bool has_data() const
Definition: gentensor.h:187

madness::WorldContainer::end
iterator end()
Returns an iterator past the end of the local data (no communication)
Definition: worlddc.h:835

simpt2key
Key< 6 > simpt2key(const Vector< double, 6 > &pt, Level n)
Returns the box at level n that contains the given point in simulation coordinates.
Definition: helium_mp2.cc:475

madness::fcube
Tensor< T > fcube(const Key< NDIM > &, T(*f)(const Vector< double, NDIM > &), const Tensor< double > &)
Definition: mraimpl.h:2047

madness::FunctionImpl::do_average
"put" this on g
Definition: funcimpl.h:2152

madness::archive::archive_ptr
Wrapper for opaque pointer ... bitwise copy of the pointer ... no remapping performed.
Definition: archive.h:788

madness::FunctionImpl::get_cdata
const FunctionCommonData< T, NDIM > & get_cdata() const
Definition: mraimpl.h:302

madness::coordT
Vector< double, 3 > coordT
Definition: chem/corepotential.cc:57

madness::FunctionImpl::average
void average(const implT &rhs)
take the average of two functions, similar to: this=0.5*(this+rhs)
Definition: mraimpl.h:1150

madness::FunctionImpl::tensorT
Tensor< T > tensorT
Type of tensor for anything but to hold coeffs.
Definition: funcimpl.h:904

madness::FunctionImpl::get_k
int get_k() const
Definition: mraimpl.h:293

madness::FunctionImpl::child_patch
std::vector< Slice > child_patch(const keyT &child) const
Returns patch referring to coeffs of child in parent box.
Definition: mraimpl.h:641

madness::FunctionImpl::change_tensor_type1
void change_tensor_type1(const TensorArgs &targs, bool fence)
change the tensor type of the coefficients in the FunctionNode
Definition: mraimpl.h:1161

madness::FunctionImpl::parent_to_child
const coeffT parent_to_child(const coeffT &s, const keyT &parent, const keyT &child) const
Directly project parent coeffs to child coeffs.
Definition: mraimpl.h:2983

beta
const double beta
Definition: gygi_soltion.cc:63

madness::FunctionImpl
FunctionImpl holds all Function state to facilitate shallow copy semantics.
Definition: funcdefaults.h:48

madness::FunctionDefaults::get_cell
static const Tensor< double > & get_cell()
Gets the user cell for the simulation.
Definition: funcdefaults.h:369

madness::Key::is_invalid
bool is_invalid() const
Checks if a key is invalid.
Definition: key.h:152

madness::detail::squareinplace::serialize
void serialize(Archive &ar)
Definition: mraimpl.h:2929

PROFILE_MEMBER_FUNC
#define PROFILE_MEMBER_FUNC(classname)
Definition: worldprofile.h:199

madness::WorldContainer::begin
iterator begin()
Returns an iterator to the beginning of the local data (no communication)
Definition: worlddc.h:822

madness::detail::scaleinplace::scaleinplace
scaleinplace()
Definition: mraimpl.h:2910

madness::FunctionImpl::do_standard
Changes non-standard compressed form to standard compressed form.
Definition: funcimpl.h:3895

madness::FunctionImpl::find_me
Future< std::pair< keyT, coeffT > > find_me(const keyT &key) const
find_me. Called by diff_bdry to get coefficients of boundary function
Definition: mraimpl.h:3059

madness::FunctionImpl::trickle_down_op
Void trickle_down_op(const keyT &key, const coeffT &s)
sum all the contributions from all scales after applying an operator in mod-NS form ...
Definition: mraimpl.h:1402

funcimpl.h
Provides FunctionCommonData, FunctionImpl and FunctionFactory.

madness::detail::scaleinplace::q
T q
Definition: mraimpl.h:2909

madness::FunctionNode::set_norm_tree
Void set_norm_tree(double norm_tree)
Sets the value of norm_tree.
Definition: funcimpl.h:295

madness::FunctionDefaults::get_bc
static const BoundaryConditions< NDIM > & get_bc()
Returns the default boundary conditions.
Definition: funcdefaults.h:345

madness::FunctionImpl::get_tensor_type
TensorType get_tensor_type() const
Definition: mraimpl.h:275

madness::FunctionImpl::scale_inplace
void scale_inplace(const T q, bool fence)
In-place scale by a constant.
Definition: mraimpl.h:2946

madness::Key::is_valid
bool is_valid() const
Checks if a key is valid.
Definition: key.h:158

madness::FunctionImpl::noautorefine
bool noautorefine(const keyT &key, const tensorT &t) const
Always returns false (for when autorefine is not wanted)
Definition: mraimpl.h:947

madness::FunctionImpl::set_autorefine
void set_autorefine(bool value)
Definition: mraimpl.h:290

madness::CoeffTracker
a class to track where relevant (parent) coeffs are
Definition: funcimpl.h:756

madness::FunctionImpl::max_local_depth
std::size_t max_local_depth() const
Returns the maximum local depth of the tree ... no communications.
Definition: mraimpl.h:1780

madness::Key::thisKeyContains
bool thisKeyContains(const Vector< double, NDIM > &x, const unsigned int &dim0, const unsigned int &dim1) const
check if this MultiIndex contains point x, disregarding these two dimensions
Definition: key.h:306

madness::FunctionImpl::erase
Void erase(const Level &max_level)
truncate tree at a certain level
Definition: mraimpl.h:823

madness::FunctionImpl::do_print_tree_graphviz
void do_print_tree_graphviz(const keyT &key, std::ostream &os, Level maxlevel) const
Definition: mraimpl.h:2620

madness::TensorArgs::thresh
double thresh
Definition: gentensor.h:128

madness::RemoteReference
Simple structure used to manage references/pointers to remote instances.
Definition: worldref.h:59

PROFILE_BLOCK
#define PROFILE_BLOCK(name)
Definition: worldprofile.h:197

madness::FunctionImpl::do_consolidate_buffer
Definition: funcimpl.h:2206

madness::FunctionImpl::do_truncate_NS_leafs
given an NS tree resulting from a convolution, truncate leafs if appropriate
Definition: funcimpl.h:1922

madness::FunctionImpl::sock_it_to_me
Void sock_it_to_me(const keyT &key, const RemoteReference< FutureImpl< std::pair< keyT, coeffT > > > &ref) const
Walk up the tree returning pair(key,node) for first node with coefficients.
Definition: mraimpl.h:2678

madness::FunctionImpl::evaldepthpt
Void evaldepthpt(const Vector< double, NDIM > &xin, const keyT &keyin, const typename Future< Level >::remote_refT &ref)
Get the depth of the tree at a point in simulation coordinates.
Definition: mraimpl.h:2800

madness::FunctionImpl::zero_norm_tree
void zero_norm_tree()
Definition: mraimpl.h:1329

madness::FunctionImpl::truncate_reconstructed_spawn
Future< coeffT > truncate_reconstructed_spawn(const keyT &key, const double tol)
truncate using a tree in reconstructed form
Definition: mraimpl.h:1560

madness::FunctionImpl::print_tree_graphviz
void print_tree_graphviz(std::ostream &os=std::cout, Level maxlevel=10000) const
Definition: mraimpl.h:2612

madness::Future::get
T & get()
Gets the value, waiting if necessary (error if not a local future)
Definition: worldfut.h:513

madness::FunctionImpl::do_print_grid
void do_print_grid(const std::string filename, const std::vector< keyT > &keys) const
print the grid in xyz format
Definition: mraimpl.h:541

std::tr1::T
const T1 &f1 return GTEST_2_TUPLE_() T(f0, f1)

madness::FunctionImpl::find_datum
std::pair< Key< NDIM >, ShallowNode< T, NDIM > > find_datum(keyT key) const
Returns a std::pair for the given key, which MUST exist.
Definition: mraimpl.h:1057

madness::FunctionImpl::verify_tree
void verify_tree() const
Verify tree is properly constructed ... global synchronization involved.
Definition: mraimpl.h:104

max
#define max(a, b)
Definition: lda.h:53

madness::vec
Vector< T, 1 > vec(T x)
Your friendly neighborhood factory function.
Definition: array.h:456

madness::FunctionImpl::print_plane_local
Tensor< double > print_plane_local(const int xaxis, const int yaxis, const coordT &el2)
collect the data for a plot of the MRA structure locally on each node
Definition: mraimpl.h:378

madness::Key::parent
Key parent(int generation=1) const
Returns the key of the parent.
Definition: key.h:248

madness::scale
void scale(World &world, std::vector< Function< T, NDIM > > &v, const std::vector< Q > &factors, bool fence=true)
Scales inplace a vector of functions by distinct values.
Definition: vmra.h:290

madness::detail::absinplace::serialize
void serialize(Archive &ar)
Definition: mraimpl.h:2935

madness::DerivativeBase::forward_do_diff1
Void forward_do_diff1(const implT *f, implT *df, const keyT &key, const argT &left, const argT &center, const argT &right) const
Definition: derivative.h:109

madness::change_tensor_type
void change_tensor_type(GenTensor< T > &t, const TensorArgs &targs)
change representation to targ.tt
Definition: gentensor.h:1309

madness::BoundaryConditions::is_periodic
std::vector< bool > is_periodic() const
Convenience for application of integral operators.
Definition: funcdefaults.h:137

madness::FunctionImpl::eval_local_only
std::pair< bool, T > eval_local_only(const Vector< double, NDIM > &xin, Level maxlevel)
Evaluate function only if point is local returning (true,value); otherwise return (false...
Definition: mraimpl.h:2771

madness::FunctionImpl::key0
const keyT & key0() const
Definition: mraimpl.h:348

madness::copy
Function< T, NDIM > copy(const Function< T, NDIM > &f, const std::shared_ptr< WorldDCPmapInterface< Key< NDIM > > > &pmap, bool fence=true)
Create a new copy of the function with different distribution and optional fence. ...
Definition: mra.h:1835

madness::FunctionImpl::gaxpy_oop_reconstructed
void gaxpy_oop_reconstructed(const double alpha, const implT &f, const double beta, const implT &g, const bool fence)
perform: this= alpha*f + beta*g, invoked by result
Definition: mraimpl.h:203

mpfr::min
const mpreal min(const mpreal &x, const mpreal &y)
Definition: mpreal.h:2675

N
const double N
Definition: navstokes_cosines.cc:94

madness::FunctionImpl::do_change_tensor_type
change representation of nodes' coeffs to low rank, optional fence
Definition: funcimpl.h:2185

madness::FunctionImpl::make_redundant_op
coeffT make_redundant_op(const keyT &key, const std::vector< Future< coeffT > > &v)
similar to compress_op, but insert only the sum coefficients in the tree
Definition: mraimpl.h:1714

a
FLOAT a(int j, FLOAT z)
Definition: y1.cc:86

madness::FunctionImpl::reset_timer
void reset_timer()
Definition: mraimpl.h:320

madness::FunctionImpl::print_grid
void print_grid(const std::string filename) const
Definition: mraimpl.h:499

madness::BoundaryConditions
This class is used to specify boundary conditions for all operators. Exterior boundary conditions (i...
Definition: funcdefaults.h:72

madness::gauss_legendre
bool gauss_legendre(int n, double xlo, double xhi, double *x, double *w)
Definition: legendre.cc:231

madness::Key::level
Level level() const
Definition: key.h:220

madness::GenTensor::reduce_rank
void reduce_rank(const double &eps)
Definition: gentensor.h:193

mu
const double mu
Definition: navstokes_cosines.cc:96

madness::FunctionImpl::upsample
coeffT upsample(const keyT &key, const coeffT &coeff) const
upsample the sum coefficients of level 1 to sum coeffs on level n+1
Definition: mraimpl.h:1267

madness::FunctionImpl::print_tree
void print_tree(std::ostream &os=std::cout, Level maxlevel=10000) const
Definition: mraimpl.h:2583

madness::tensorT
Tensor< double > tensorT
Definition: chem/distpm.cc:13

madness::FunctionImpl::truncate
void truncate(double tol, bool fence)
Truncate according to the threshold with optional global fence.
Definition: mraimpl.h:332

madness::TensorArgs
TensorArgs holds the arguments for creating a LowRankTensor.
Definition: gentensor.h:127

madness::FunctionImpl::reconstruct_op
Void reconstruct_op(const keyT &key, const coeffT &s)
Definition: mraimpl.h:1992

madness::FunctionImpl::check_symmetry_local
double check_symmetry_local() const
Returns some asymmetry measure ... no comms.
Definition: mraimpl.h:840

madness::detail::scaleinplace
Definition: mraimpl.h:2908

madness::FunctionImpl::evalR
Void evalR(const Vector< double, NDIM > &xin, const keyT &keyin, const typename Future< long >::remote_refT &ref)
Get the rank of leaf box of the tree at a point in simulation coordinates.
Definition: mraimpl.h:2842

mu
Namespace for mathematical applications.
Definition: muParser.cpp:47

madness::TT_2D
Definition: tensor.h:275

madness::ShallowNode
shallow-copy, pared-down version of FunctionNode, for special purpose only
Definition: funcimpl.h:717

madness::FunctionImpl::broaden
void broaden(std::vector< bool > is_periodic, bool fence)
Definition: mraimpl.h:1338

madness::FutureImpl
Implements the functionality of Futures.
Definition: worldfut.h:157

madness::FunctionImpl::flo_unary_op_node_inplace
void flo_unary_op_node_inplace(const opT &op, bool fence)
Unary operation applied inplace to the coefficients WITHOUT refinement, optional fence.
Definition: funcimpl.h:1897

madness::FunctionImpl::do_mapdim
map this on f
Definition: funcimpl.h:2122

madness::TaskAttributes::generator
static TaskAttributes generator()
Definition: worldthread.h:273

madness::FunctionImpl::truncate_op
bool truncate_op(const keyT &key, double tol, const std::vector< Future< bool > > &v)
Actually do the truncate operation.
Definition: mraimpl.h:2555

madness::ElementaryInterface
ElementaryInterface (formerly FunctorInterfaceWrapper) interfaces a c-function.
Definition: function_interface.h:207

madness::FunctionImpl::is_on_demand
bool & is_on_demand()
Definition: mraimpl.h:269

worldobj.h
Defines and implements WorldObject.

madness::standard
void standard(World &world, std::vector< Function< T, NDIM > > &v, bool fence=true)
Generates standard form of a vector of functions.
Definition: vmra.h:181

madness::FunctionImpl::set_thresh
void set_thresh(double value)
Definition: mraimpl.h:284

madness::FunctionImpl::is_nonstandard
bool is_nonstandard() const
Definition: mraimpl.h:242

sqrt
tensorT sqrt(const tensorT &s, double tol=1e-8)
Computes matrix square root (not used any more?)
Definition: DFcode/moldft.cc:446

madness::World
A parallel world with full functionality wrapping an MPI communicator.
Definition: worldfwd.h:416

madness::WorldGopInterface::fence
void fence()
Synchronizes all processes in communicator AND globally ensures no pending AM or tasks.
Definition: worldgop.cc:52

madness::GenTensor::tensor_type
TensorType tensor_type() const
Definition: gentensor.h:197

madness::FunctionImpl::get_functor
std::shared_ptr< FunctionFunctorInterface< T, NDIM > > get_functor()
Definition: mraimpl.h:251

madness::FunctionImpl::reduce_rank
void reduce_rank(const TensorArgs &targs, bool fence)
reduce the rank of the coefficients tensors
Definition: mraimpl.h:1169

mpfr::round
const mpreal round(const mpreal &v)
Definition: mpreal.h:2611

madness::FunctionImpl::reconstruct
void reconstruct(bool fence)
Definition: mraimpl.h:1444

madness::FunctionImpl::project_refine_op
Void project_refine_op(const keyT &key, bool do_refine, const std::vector< Vector< double, NDIM > > &specialpts)
Projection with optional refinement.
Definition: mraimpl.h:2368

madness::Function
A multiresolution adaptive numerical function.
Definition: derivative.h:61

madness::Level
int Level
Definition: key.h:58

madness::detail::scaleinplace::serialize
void serialize(Archive &ar)
Definition: mraimpl.h:2919

ProcessID
int ProcessID
Used to clearly identify process number/rank.
Definition: worldtypes.h:37

madness::ScopedArray
Scoped array.
Definition: scopedptr.h:85

madness::FunctionImpl::trace_local
T trace_local() const
Returns int(f(x),x) in local volume.
Definition: mraimpl.h:3000

madness::FunctionImpl::true_refine_test
Definition: funcimpl.h:3757

madness::FunctionImpl::print_size
void print_size(const std::string name) const
print tree size and size
Definition: mraimpl.h:1874

mpfr::sum
const mpreal sum(const mpreal tab[], unsigned long int n, mp_rnd_t rnd_mode)
Definition: mpreal.cc:241

madness::detail::noop::serialize
void serialize(Archive &ar)
Definition: mraimpl.h:2904

madness::FunctionNode
FunctionNode holds the coefficients, etc., at each node of the 2^NDIM-tree.
Definition: derivative.h:58

madness::DerivativeBase
Tri-diagonal operator traversing tree primarily for derivative operator.
Definition: derivative.h:73

madness::FunctionFunctorInterface
Abstract base class interface required for functors used as input to Functions.
Definition: function_interface.h:58

m
const double m
Definition: gfit.cc:199

madness::FunctionImpl::eval_plot_cube
Tensor< T > eval_plot_cube(const coordT &plotlo, const coordT &plothi, const std::vector< long > &npt, const bool eval_refine=false) const
Evaluate a cube/slice of points ... plotlo and plothi are already in simulation coordinates.
Definition: mraimpl.h:3192

madness::World::rank
ProcessID rank() const
Returns the process rank in this world (same as MPI_Comm_rank())
Definition: worldfwd.h:526

madness::FunctionImpl::accumulate_timer
Void accumulate_timer(const double time) const
Definition: mraimpl.h:305

madness::FunctionImpl::do_check_symmetry_local
check symmetry wrt particle exchange
Definition: funcimpl.h:2012

madness::FunctionImpl::finalize_apply
double finalize_apply(const bool fence=true)
after apply we need to do some cleanup
Definition: mraimpl.h:1741

madness::FunctionImpl::norm_tree
void norm_tree(bool fence)
compute for each FunctionNode the norm of the function inside that node
Definition: mraimpl.h:1514

madness::FunctionNode::set_has_children
Void set_has_children(bool flag)
Sets has_children attribute to value of flag.
Definition: funcimpl.h:244

madness::FunctionImpl::print_stats
void print_stats() const
print the number of configurations per node
Definition: mraimpl.h:1898

madness::GenTensor::full_tensor
GenTensor< T > full_tensor() const
Definition: gentensor.h:182

test
void test(World &world, bool doloadbal=false)
Definition: dataloadbal.cc:225

madness::FunctionImpl::broaden_op
Void broaden_op(const keyT &key, const std::vector< Future< bool > > &v)
Definition: mraimpl.h:1317

madness::FunctionImpl::is_redundant
bool is_redundant() const
Returns true if the function is redundant.
Definition: mraimpl.h:237

madness::general_transform
GenTensor< TENSOR_RESULT_TYPE(T, Q)> general_transform(const GenTensor< T > &t, const Tensor< Q > c[])
Transform all dimensions of the tensor t by distinct matrices c.
Definition: gentensor.h:1342

madness::FunctionImpl::do_convert_to_color
Definition: funcimpl.h:1250

madness::abs
double abs(double x)
Definition: complexfun.h:48

madness::Key::is_neighbor_of
bool is_neighbor_of(const Key &key, const std::vector< bool > &bperiodic) const
Assuming keys are at the same level, returns true if displaced by no more than 1 in any direction...
Definition: key.h:283

madness::FunctionImpl::tree_size
std::size_t tree_size() const
Returns the size of the tree structure of the function ... collective global sum. ...
Definition: mraimpl.h:1820

madness::Future::remote_ref
remote_refT remote_ref(World &world) const
Returns a structure used to pass references to another process.
Definition: worldfut.h:552

madness::Range
Range vaguely a la Intel TBB encapsulates random-access STL-like start and end iterators with chunksize.
Definition: worldrange.h:49

madness::FunctionImpl::get_pmap
const std::shared_ptr< WorldDCPmapInterface< Key< NDIM > > > & get_pmap() const
Definition: mraimpl.h:187

madness::FunctionNode::clear_coeff
void clear_coeff()
Clears the coefficients (has_coeff() will subsequently return false)
Definition: funcimpl.h:284

madness::BaseTensor::size
long size() const
Returns the number of elements in the tensor.
Definition: basetensor.h:138

madness::FunctionImpl::diff
void diff(const DerivativeBase< T, NDIM > *D, const implT *f, bool fence)
Definition: mraimpl.h:1035

madness::FunctionImpl::truncate_spawn
Future< bool > truncate_spawn(const keyT &key, double tol)
Returns true if after truncation this node has coefficients.
Definition: mraimpl.h:2519

madness::FunctionDefaults::get_cell_width
static const Tensor< double > & get_cell_width()
Returns the width of each user cell dimension.
Definition: funcdefaults.h:391

madness::FunctionImpl::standard
void standard(bool fence)
Changes non-standard compressed form to standard compressed form.
Definition: mraimpl.h:1732

worlddc.h
Implements WorldContainer.

madness::FunctionImpl::simpt2key
Key< NDIM > simpt2key(const coordT &pt, Level n) const
Returns the box at level n that contains the given point in simulation coordinates.
Definition: mraimpl.h:694

madness::GenTensor::real_size
size_t real_size() const
Definition: gentensor.h:191

madness::Future
A future is a possibly yet unevaluated value.
Definition: ref.h:210

madness::Void
A type you can return when you want to return void ... use "return None".
Definition: typestuff.h:154

madness::FunctionImpl::fcube
void fcube(const keyT &key, const FunctionFunctorInterface< T, NDIM > &f, const Tensor< double > &qx, tensorT &fval) const
Evaluate function at quadrature points in the specified box.
Definition: mraimpl.h:2356

madness::FunctionImpl::exists_and_has_children
bool exists_and_has_children(const keyT &key) const
Definition: mraimpl.h:1306

madness::FunctionImpl::coeffs_for_jun
tensorT coeffs_for_jun(Level n, long q=0)
Get the scaling function coeffs at level n starting from NS form.
Definition: mraimpl.h:708

madness::fast_transform
Tensor< TENSOR_RESULT_TYPE(T, Q) > & fast_transform(const Tensor< T > &t, const Tensor< Q > &c, Tensor< TENSOR_RESULT_TYPE(T, Q) > &result, Tensor< TENSOR_RESULT_TYPE(T, Q) > &workspace)
Restricted but heavily optimized form of transform()
Definition: tensor.h:2351

madness::transpose
Tensor< T > transpose(const Tensor< T > &t)
Returns a new deep copy of the transpose of the input tensor.
Definition: tensor.h:1945

displacements.h

op
Tensor< double > op(const Tensor< double > &x)
Definition: kain.cc:508

madness::BC_FREE
Definition: funcdefaults.h:56

madness::print
void print(const A &a)
Print a single item to std::cout terminating with new line.
Definition: print.h:122

madness::FunctionCommonData
FunctionCommonData holds all Function data common for given k.
Definition: function_common_data.h:52

madness::project
Function< T, NDIM > project(const Function< T, NDIM > &other, int k=FunctionDefaults< NDIM >::get_k(), double thresh=FunctionDefaults< NDIM >::get_thresh(), bool fence=true)
Definition: mra.h:2162

madness::FunctionImpl::assemble_coefficients
coeffT assemble_coefficients(const keyT &key, const coeffT &coeff_ket, const coeffT &vpotential1, const coeffT &vpotential2, const tensorT &veri) const
given several coefficient tensors, assemble a result tensor
Definition: mraimpl.h:1099

MADNESS_EXCEPTION
#define MADNESS_EXCEPTION(msg, value)
Definition: worldexc.h:88

madness::FunctionFunctorInterface::screened
virtual bool screened(const Vector< double, NDIM > &c1, const Vector< double, NDIM > &c2) const
Can we screen this function based on the bounding box information?
Definition: function_interface.h:65

madness::FunctionImpl::filter
tensorT filter(const tensorT &s) const
Transform sum coefficients at level n to sums+differences at level n-1.
Definition: mraimpl.h:1188

madness::FunctionImpl::print_info
void print_info() const
Prints summary of data distribution.
Definition: mraimpl.h:921

madness::Slice
A slice defines a sub-range or patch of a dimension.
Definition: slice.h:103

madness::FunctionImpl::compress_spawn
Future< coeffT > compress_spawn(const keyT &key, bool nonstandard, bool keepleaves, bool redundant)
Definition: mraimpl.h:3070

madness::FunctionImpl::exists_and_is_leaf
bool exists_and_is_leaf(const keyT &key) const
Definition: mraimpl.h:1311

madness::FunctionImpl::do_print_plane
Void do_print_plane(const std::string filename, std::vector< Tensor< double > > plotinfo, const int xaxis, const int yaxis, const coordT el2)
print the MRA structure
Definition: mraimpl.h:454

madness::detail::squareinplace::operator()
void operator()(const Key< NDIM > &key, Tensor< T > &t) const
Definition: mraimpl.h:2926

madness::detail::absinplace::operator()
void operator()(const Key< NDIM > &key, Tensor< T > &t) const
Definition: mraimpl.h:2934

madness::detail::absinplace
Definition: mraimpl.h:2933

madness::GenTensor
Definition: gentensor.h:123

madness::FunctionImpl::norm_tree_spawn
Future< double > norm_tree_spawn(const keyT &key)
Definition: mraimpl.h:1537

madness::FunctionImpl::get_autorefine
bool get_autorefine() const
Definition: mraimpl.h:287

madness::IndexIterator
Definition: indexit.h:55

madness::FunctionImpl::autorefine_square_test
bool autorefine_square_test(const keyT &key, const nodeT &t) const
Returns true if this block of coeffs needs autorefining.
Definition: mraimpl.h:953

madness::Future::set
void set(const Future< T > &other)
A.set(B) where A & B are futures ensures A has/will have the same value as B.
Definition: worldfut.h:473

madness::TT_FULL
Definition: tensor.h:275

madness::FunctionImpl::undo_redundant
void undo_redundant(const bool fence)
convert this from redundant to standard reconstructed form
Definition: mraimpl.h:1504

madness::FunctionImpl::eval
Void eval(const Vector< double, NDIM > &xin, const keyT &keyin, const typename Future< T >::remote_refT &ref)
Evaluate the function at a point in simulation coordinates.
Definition: mraimpl.h:2727

madness::FunctionImpl::norm2sq_local
double norm2sq_local() const
Returns the square of the local norm ... no comms.
Definition: mraimpl.h:1768

madness::multiply
Function< T, NDIM > multiply(const Function< T, NDIM > f, const Function< T, LDIM > g, const int particle, const bool fence=true)
multiply a high-dimensional function with a low-dimensional function
Definition: mra.h:2116

madness::Translation
int64_t Translation
Definition: key.h:57

madness::two_scale_hg
bool two_scale_hg(int k, Tensor< double > *hg)
Definition: twoscale.cc:156

madness::detail::noop
Definition: mraimpl.h:2901

madness::FunctionImpl::do_reduce_rank
reduce the rank of the nodes, optional fence
Definition: funcimpl.h:1986

madness::FunctionImpl::add_op
add two functions f and g: result=alpha * f + beta * g
Definition: funcimpl.h:2956

madness::detail::scaleinplace::operator()
void operator()(const Key< NDIM > &key, Tensor< T > &t) const
Definition: mraimpl.h:2913

madness
Holds machinery to set up Functions/FuncImpls using various Factories and Interfaces.
Definition: chem/atomutil.cc:45

madness::FunctionImpl::get_coeffs
const dcT & get_coeffs() const
Definition: mraimpl.h:296

c
const double c
Definition: gfit.cc:200

madness::transform
std::vector< Function< TENSOR_RESULT_TYPE(T, R), NDIM > > transform(World &world, const std::vector< Function< T, NDIM > > &v, const DistributedMatrix< R > &c, bool fence=true)
Definition: chem/SCF.cc:86

b
FLOAT b(int j, FLOAT z)
Definition: y1.cc:79

madness::FunctionImpl::print_timer
void print_timer() const
Definition: mraimpl.h:311

madness::wall_time
double wall_time()
Returns the wall time in seconds relative to arbitrary origin.
Definition: world.cc:248

madness::FunctionImpl::do_norm2sq_local
Definition: funcimpl.h:4598

madness::Key
Key is the index for a node of the 2^NDIM-tree.
Definition: key.h:69

madness::FunctionImpl::unfilter
tensorT unfilter(const tensorT &s) const
Transform sums+differences at level n to sum coefficients at level n+1.
Definition: mraimpl.h:1217

madness::FunctionImpl::project
tensorT project(const keyT &key) const
Compute by projection the scaling function coeffs in specified box.
Definition: mraimpl.h:2646

madness::FunctionImpl::truncate_tol
double truncate_tol(double tol, const keyT &key) const
Returns the truncation threshold according to truncate_method.
Definition: mraimpl.h:613

madness::FunctionImpl::unset_functor
void unset_functor()
Definition: mraimpl.h:263

madness::FunctionImpl::get_tensor_args
TensorArgs get_tensor_args() const
Definition: mraimpl.h:278

madness::FunctionImpl::neighbor
keyT neighbor(const keyT &key, const keyT &disp, const std::vector< bool > &is_periodic) const
Returns key of general neighbor enforcing BC.
Definition: mraimpl.h:3042

madness::HighDimIndexIterator
Definition: indexit.h:141

madness::FunctionImpl::eval_cube
T eval_cube(Level n, coordT &x, const tensorT &c) const
Definition: mraimpl.h:1938

madness::FunctionFunctorInterface::supports_vectorized
virtual bool supports_vectorized() const
Does the interface support a vectorized operator()?
Definition: function_interface.h:70

PROFILE_FUNC
#define PROFILE_FUNC
Definition: worldprofile.h:198

madness::FunctionImpl::forward_do_diff1
Void forward_do_diff1(const DerivativeBase< T, NDIM > *D, const implT *f, const keyT &key, const std::pair< keyT, coeffT > &left, const std::pair< keyT, coeffT > &center, const std::pair< keyT, coeffT > &right)
Definition: mraimpl.h:1012

madness::TensorTypeData
Traits class to specify support of numeric types.
Definition: type_data.h:56

madness::FunctionImpl::tnorm
void tnorm(const tensorT &t, double *lo, double *hi) const
Computes norm of low/high-order polyn. coeffs for autorefinement test.
Definition: mraimpl.h:2885

madness::FunctionImpl::sum_down
void sum_down(bool fence)
After 1d push operator must sum coeffs down the tree to restore correct scaling function coefficients...
Definition: mraimpl.h:1004

worldhashmap.h
Defines and implements a concurrent hashmap.

madness::FunctionImpl::make_redundant
void make_redundant(const bool fence)
convert this to redundant, i.e. have sum coefficients on all levels
Definition: mraimpl.h:1485

madness::detail::scaleinplace::scaleinplace
scaleinplace(T q)
Definition: mraimpl.h:2912

madness::FunctionImpl::refine_to_common_level
Void refine_to_common_level(const std::vector< FunctionImpl< T, NDIM > * > &v, const std::vector< tensorT > &c, const keyT key)
Refine multiple functions down to the same finest level.
Definition: mraimpl.h:854

madness::compress
void compress(World &world, const std::vector< Function< T, NDIM > > &v, bool fence=true)
Compress a vector of functions.
Definition: vmra.h:130

madness::FunctionImpl::mapdim
void mapdim(const implT &f, const std::vector< long > &map, bool fence)
Permute the dimensions of f according to map, result on this.
Definition: mraimpl.h:1138

madness::GenTensor::rank
long rank() const
Definition: gentensor.h:189

madness::detail::abssquareinplace::serialize
void serialize(Archive &ar)
Definition: mraimpl.h:2941

madness::KeyChildIterator
Iterates in lexical order thru all children of a key.
Definition: key.h:61

madness::FunctionImpl::put_in_box
Void put_in_box(ProcessID from, long nl, long ni) const
Definition: mraimpl.h:911