ctf/scan_8cxx_source.html

 #include <ctf.hpp>
 #include <float.h>
 #include <string>
 #include <vector>
 using namespace CTF;

 /**
  * \brief Recursive kernel of the contraction-based scan; overwrites V in place.
  *
  * Order 1: V is contracted with W2, which is obtained from a matrix filled with
  * the multiplicative identity of V's algebraic structure by copying it first
  * with symmetry {SH, NS} and then with symmetry {NS, NS}.
  *
  * Order > 1: the first mode of V is summed away into V2, V2 is processed
  * recursively, and V is rebuilt as (W2 contracted with V along the first mode)
  * plus V2 broadcast along the first mode.
  *
  * \param[in,out] V tensor to process; its contents are replaced by the result
  */
 template <typename dtype>
 void rec_scan(Tensor<dtype> & V){

   if (V.order == 1){
     // NOTE(review): the (2, n, n, world, sr) argument pattern is kept exactly
     // as it was; confirm which Matrix constructor overload it selects.
     Matrix<dtype> W(2, V.lens[0], V.lens[0], *V.wrld, *V.sr);
     dtype mulid = ((dtype*)V.sr->mulid())[0];
     // set every entry of W to the multiplicative identity
     W["ij"], [=](dtype & a){ a=mulid; };
     int ssym[] = {SH, NS};
     int nsym[] = {NS, NS};
     Tensor<dtype> W1(W, ssym);
     Tensor<dtype> W2(W1, nsym);
     V["i"] = W2["ji"]*V["j"];
   } else {
     // one index label per mode of V: "abc..."; std::string replaces the
     // former variable-length char array and is null-terminated
     std::string str(V.order, 'a');
     for (int i=0; i<V.order; i++){ str[i] = 'a'+i; }

     // V2 is indexed with str+1, i.e. it carries modes 1..order-1 of V, so its
     // edge lengths start at V.lens[1]
     Tensor<dtype> V2(V.order-1, V.lens+1, *V.wrld, *V.sr);
     V2[str.c_str()+1] += V[str.c_str()];
     rec_scan(V2);

     // W is contracted against the first mode of V (label 'a'), so it is sized
     // by V.lens[0]
     // NOTE(review): same (2, n, n, world, sr) pattern as above; confirm overload.
     Matrix<dtype> W(2, V.lens[0], V.lens[0], *V.wrld, *V.sr);
     dtype mulid = ((dtype*)V.sr->mulid())[0];
     W["ij"], [=](dtype & a){ a=mulid; };
     int hsym[] = {SH, NS};
     int nsym[] = {NS, NS};
     Tensor<dtype> W1(W, hsym);
     Tensor<dtype> W2(W1, nsym);

     // str2 is str with its first label replaced by a fresh one, which becomes
     // the contracted index shared by W2 and V
     std::string str2(str);
     str2[0] = 'a'+V.order;
     char const strW[3] = {str2[0], 'a', '\0'};
     V[str.c_str()]  = W2[strW]*V[str2.c_str()];
     V[str.c_str()] += V2[str.c_str()+1];
   }
 }

 /**
  * \brief Scans vector v in place by reshaping it into an order-logn tensor
  *        with every edge length 2 and running rec_scan on that tensor.
  *
  * \param[in,out] v    vector to scan; overwritten with the result
  * \param[in]     logn number of tensor modes to use (each of length 2)
  */
 template<typename dtype>
 void scan(Vector<dtype> & v, int logn){
   int64_t np;
   int64_t * inds;
   // element buffer must match the tensor's element type, not be fixed to double
   dtype * data;

   // edge lengths of the 2-by-...-by-2 tensor
   std::vector<int> lens(logn, 2);

   // represent vector to scan as 2-by-...-by-2 tensor
   Tensor<dtype> V(logn, lens.data(), *v.wrld, *v.sr);

   // move this process's entries of v into V using their global indices
   v.get_local_data(&np, &inds, &data);
   V.write(np, inds, data);

   free(inds);
   delete [] data;

   rec_scan(V);

   // put the data from the tensor back into the vector
   V.get_local_data(&np, &inds, &data);
   v.write(np, inds, data);

   free(inds);
   delete [] data;
 }

 /**
  * \brief Runs scan() on a random vector of length 2^logn and checks the result.
  *
  * The check requires every output element to equal the previous output
  * element plus the previous input element, within 1.E-9 * 2^logn.
  *
  * \param[in] logn base-2 logarithm of the vector length
  * \param[in] dw   CTF world on which the vector is defined
  * \return 1 if the check passed, 0 otherwise (the verdict is printed on rank 0)
  */
 int scan_test(int     logn,
               World & dw){

   int const n = 1<<logn;

   Vector<> v(n, dw);

   srand48(dw.rank*27);
   v.fill_random(0.0, 1.0);

   // heap storage: the buffers grow as 2^logn, which is too large for the
   // stack beyond small logn
   std::vector<double> start_data(n);

   v.read_all(start_data.data());

   scan(v, logn);

   std::vector<double> data(n);

   v.read_all(data.data());

   int pass = 1;
   for (int i=1; i<n; i++){
     if (std::abs(data[i] - start_data[i-1] - data[i-1]) >= 1.E-9*n) pass = 0;
   }
   if (dw.rank == 0){
     if (pass)
       printf("{ scan via tensor contractions } passed \n");
     else
       printf("{ scan via tensor contractions } failed \n");
   }
   return pass;
 }


 #ifndef TEST_SUITE
 /**
  * \brief Looks up the value that follows a command-line flag.
  *
  * Only the first argument equal to option is considered.
  *
  * \param[in] begin  first argument to inspect
  * \param[in] end    one past the last argument to inspect
  * \param[in] option flag to search for
  * \return the argument right after the first occurrence of option, or a null
  *         pointer if option is absent or is the last argument
  */
 char* getCmdOption(char ** begin,
                    char ** end,
                    const   std::string & option){
   for (char ** cur = begin; cur != end; ++cur){
     if (*cur == option){
       // the first match decides the outcome, even when it has no value after it
       char ** value = cur + 1;
       return (value != end) ? *value : nullptr;
     }
   }
   return nullptr;
 }


 /**
  * \brief Stand-alone driver: parses "-logn <k>", runs scan_test on a vector of
  *        length 2^k inside an MPI session, and asserts that the test passed.
  *
  * k defaults to 4 when the option is absent or outside [0, 30].
  */
 int main(int argc, char ** argv){
   int rank, np, logn, pass;
   // remember the original arguments before MPI_Init is handed argc/argv
   int const in_num = argc;
   char ** input_str = argv;

   MPI_Init(&argc, &argv);
   MPI_Comm_rank(MPI_COMM_WORLD, &rank);
   MPI_Comm_size(MPI_COMM_WORLD, &np);

   logn = 4;
   char const * logn_arg = getCmdOption(input_str, input_str+in_num, "-logn");
   if (logn_arg){
     int const requested = atoi(logn_arg);
     // 1<<logn is evaluated in int, so exponents above 30 would overflow;
     // treat them like negative values and keep the default
     if (requested >= 0 && requested <= 30) logn = requested;
   }


   {
     // scoped so that the World is destroyed before MPI_Finalize
     World dw(argc, argv);

     if (rank == 0){
       printf("Running scan on dimension %d vector\n",1<<logn);
     }
     pass = scan_test(logn, dw);
     assert(pass);
   }

   MPI_Finalize();
   return 0;
 }
 #endif
ctf.hpp

CTF::Matrix
Matrix class which encapsulates a 2D tensor.
Definition: matrix.h:18

ctf.core.rank
def rank(self)
Definition: core.pyx:312

CTF::Vector
Vector class which encapsulates a 1D tensor.
Definition: vector.h:14

CTF::Tensor::read_all
void read_all(int64_t *npair, dtype **data, bool unpack=false)
collects the entire tensor data on each process (not memory scalable)
Definition: tensor.cxx:377

NS
Definition: common.h:37

getCmdOption
char * getCmdOption(char **begin, char **end, const std::string &option)
Definition: scan.cxx:108

CTF::World
an instance of the CTF library (world) on a MPI communicator
Definition: world.h:19

CTF_int::tensor::order
int order
number of tensor dimensions
Definition: untyped_tensor.h:76

ctf.core.string
string
Definition: core.pyx:456

CTF_int::tensor::wrld
CTF::World * wrld
distributed processor context on which tensor is defined
Definition: untyped_tensor.h:70

ctf.core.a
a
Definition: core.pyx:385

CTF::Tensor::fill_random
void fill_random(dtype rmin, dtype rmax)
fills local unique tensor elements to random values in the range [min,max]; works only for dtype in {f...
Definition: tensor.cxx:928

CTF::World::rank
int rank
rank of local processor
Definition: world.h:24

CTF_int::tensor::lens
int * lens
unpadded tensor edge lengths
Definition: untyped_tensor.h:78

ctf.core.dtype
dtype
Definition: core.pyx:387

rec_scan
void rec_scan(Tensor< dtype > &V)
Definition: scan.cxx:13

CTF_int::tensor::sr
algstrct * sr
algstrct on which tensor elements and operations are defined
Definition: untyped_tensor.h:72

scan
void scan(Vector< dtype > &v, int logn)
Definition: scan.cxx:48

ctf.core.abs
def abs(initA)
Definition: core.pyx:5440

scan_test
int scan_test(int logn, World &dw)
Definition: scan.cxx:75

main
int main(int argc, char **argv)
Definition: scan.cxx:119

CTF::Tensor::get_local_data
void get_local_data(int64_t *npair, int64_t **global_idx, dtype **data, bool nonzeros_only=false, bool unpack_sym=false) const
Gives the global indices and values associated with the local data.
Definition: tensor.cxx:159

CTF
Definition: apsp.cxx:17

CTF::Tensor
an instance of a tensor within a CTF world
Definition: tensor.h:74

CTF::Tensor::write
void write(int64_t npair, int64_t const *global_idx, dtype const *data)
writes in values associated with any set of indices. The sparse data is defined in coordinate format...
Definition: tensor.cxx:264

SH
Definition: common.h:37

ctf.core.np
def np(self)
Definition: core.pyx:315