ctf/sparse__permuted__slice_8cxx_source.html

 /*Copyright (c) 2011, Edgar Solomonik, all rights reserved.*/
 #include <ctf.hpp>
 using namespace CTF;
 /**
  * \brief tests sparse remote global write via permute function
  *
  * Every rank builds a small random block B on its own single-process world
  * (MPI_COMM_SELF), adds it into the distributed n-by-n matrix A through a
  * randomly drawn index permutation, and then verifies the result by
  * repeating the write into a 3D tensor that has one slab per rank.
  *
  * \param[in] n   dimension of the distributed matrix A (must be > 0)
  * \param[in] b   base block size (must be > 0); each rank uses a block of
  *                size b + rand()%b, capped at n
  * \param[in] sym symmetry attribute passed to the tensor constructors
  * \param[in] dw  world on which the distributed tensors are created
  * \return 1 if every rank passed both checks, 0 otherwise
  */
 int sparse_permuted_slice(int     n,
                           int     b,
                           int     sym,
                           World & dw){
   int np, rank, pass, bi;
   int64_t i, j, nvals;
   int64_t * indices;
   double * data;
   int * perm;

   MPI_Comm_rank(MPI_COMM_WORLD, &rank);
   MPI_Comm_size(MPI_COMM_WORLD, &np);

   // rand()%b and rand()%n below are undefined for zero, so reject degenerate
   // sizes before any collective call is made.
   // NOTE(review): assumes all ranks were given the same n and b, so that
   // they all leave here together -- confirm against callers.
   if (n < 1 || b < 1){
     if (rank == 0){
       printf("sparse_permuted_slice requires n > 0 and b > 0 (got n=%d, b=%d)\n", n, b);
       printf("{ sparse permuted slice among multiple worlds } failed\n");
     }
     return 0;
   }

   srand(rank*13+7);

   //make each block have somewhat different size
   bi = b + (rand()%b);
   // only n distinct indices exist in [0,n); a larger block would make the
   // rejection loop below spin forever
   if (bi > n) bi = n;

   perm = (int*)malloc(sizeof(int)*bi);
   // the same index map is applied to both modes of the matrix
   int * perms[2] = {perm, perm};

   //each block is random permuted symmetric submatrix
   for (i=0; i<bi; i++){
     int cont = 1;
     // redraw until perm[i] differs from every previously chosen index
     while (cont){
       perm[i] = rand()%n;
       cont = 0;
       for (j=0; j<i; j++){
         if (perm[i] == perm[j]) cont = 1;
       }
     }
   }

   Matrix<> A(n, n, sym, dw, "A");

   World id_world(MPI_COMM_SELF);

   Matrix<> B(bi, bi, sym, id_world, "B");

   B.get_local_data(&nvals, &indices, &data);

   srand48(rank*29+3);
   for (i=0; i<nvals; i++){
     data[i] = drand48();
   }
   B.write(nvals, indices, data);
   free(indices);
   delete [] data;


   // this is the main command that does the sparse write

   double t_str = 0.0, t_stp;
   if (rank == 0)
     t_str = MPI_Wtime();

   A.permute(1.0, B, perms, 1.0);
   if (rank == 0){
     t_stp = MPI_Wtime();
     printf("permute took %lf sec\n", t_stp-t_str);
   }


   // Everything below is simply to test the above permute call,
   // which is hard since there are overlapped writes

   int lens_Arep[3] = {n,n,np};
   int symm[3] = {sym,NS,NS};
   int lens_B3[3] = {bi,bi,1};

   Tensor<> A_rep(3, lens_Arep, symm, dw, "A_rep");
   Tensor<> B3(3, lens_B3, symm, id_world, "B3");

   B3["ijk"] = B["ij"];


   // third mode has length 1 in B3 and is mapped to this rank's own slab
   int * perms_rep[3] = {perm, perm, &rank};

   // Write into a 3D tensor to avoid overlapped writes
   A_rep.permute(1.0, B3, perms_rep, 1.0);
   // Retrieve the data I wrote from B3 into A_rep back into callback_B3
   Tensor<> callback_B3(3, lens_B3, symm, id_world, "cB3");
   callback_B3.permute(perms_rep, 1.0, A_rep, 1.0);


   // Check that B == callback_B3
   // NOTE(review): callback_B3 is declared with 3 modes but indexed with two
   // labels here; kept as in the original -- confirm this is intended.
   callback_B3["ij"] = callback_B3["ij"] - B["ij"];
   //callback_B3["ij"] -= B["ij"];

   pass = callback_B3.norm2() < 1.E-10;

   // callback_B3 lives on id_world (MPI_COMM_SELF), so this verdict is local
   // to each rank.  Agree on it globally before deciding to leave: otherwise
   // a failing rank would return while the others block in the
   // MPI_Allreduce further down.
   MPI_Allreduce(MPI_IN_PLACE, &pass, 1, MPI_INT, MPI_MIN, MPI_COMM_WORLD);

   if (!pass){
     if (rank == 0){
       printf("Callback from permuted write returned incorrect values\n");
       printf("{ sparse permuted slice among multiple worlds } failed\n");
     }
     free(perm);
     return 0;
   }

   // Check that if we sum over the replicated dimension we get the same thing
   // as in the original sparse write
   Matrix<> ERR(n, n, sym, dw);
   ERR["ij"] = A_rep["ijk"] - A["ij"];

   pass = ERR.norm2() < 1.E-10;

   MPI_Allreduce(MPI_IN_PLACE, &pass, 1, MPI_INT, MPI_MIN, MPI_COMM_WORLD);

   if (rank == 0){
     if (pass)
       printf("{ sparse permuted slice among multiple worlds } passed\n");
     else
       printf("{ sparse permuted slice among multiple worlds } failed\n");
   }
   free(perm);
   return pass;
 }


 #ifndef TEST_SUITE
 /**
  * \brief looks up the value that follows a command-line flag
  *
  * Scans [begin,end) for the first entry equal to option and returns the
  * entry right after it.
  *
  * \param[in] begin  first argument string
  * \param[in] end    one past the last argument string
  * \param[in] option flag to search for, e.g. "-n"
  * \return the string following the first occurrence of option, or a null
  *         pointer if the flag is absent or is the last entry
  */
 char* getCmdOption(char ** begin,
                    char ** end,
                    const   std::string & option){
   for (char ** arg = begin; arg != end; ++arg){
     if (*arg == option){
       // only the first match counts; its value is the next entry, if any
       char ** value = arg + 1;
       if (value == end){
         return nullptr;
       }
       return *value;
     }
   }
   return nullptr;
 }

 /**
  * \brief driver: runs sparse_permuted_slice once per symmetry type
  *
  * Command-line options:
  *   -n <int>  dimension of the distributed matrix (default 256)
  *   -b <int>  base block size (default 16)
  * A missing, non-numeric, zero or negative value falls back to the default.
  *
  * \return 0 if all four tests passed, 1 otherwise
  */
 int main(int argc, char ** argv){
   int rank, n, b;
   // remember the argument list as it was before MPI_Init gets to see it
   int const in_num = argc;
   char ** input_str = argv;

   MPI_Init(&argc, &argv);
   MPI_Comm_rank(MPI_COMM_WORLD, &rank);

   // Zero is rejected along with negatives: the test computes rand()%n and
   // rand()%b, which are undefined for a zero divisor.
   n = 256;
   char * n_arg = getCmdOption(input_str, input_str+in_num, "-n");
   if (n_arg){
     n = atoi(n_arg);
     if (n <= 0) n = 256;
   }

   b = 16;
   char * b_arg = getCmdOption(input_str, input_str+in_num, "-b");
   if (b_arg){
     b = atoi(b_arg);
     if (b <= 0) b = 16;
   }

   int all_pass = 1;
   {
     // dw is scoped so that it is destroyed before MPI_Finalize
     World dw(MPI_COMM_WORLD, argc, argv);
     const int syms[4] = {NS, SY, SH, AS};
     const char * sym_names[4] = {"nonsymmetric", "symmetric",
                                  "symmetric-hollow", "asymmetric"};
     for (int t=0; t<4; t++){
       if (rank == 0){
         printf("Testing %s multiworld permutation with n=%d\n", sym_names[t], n);
       }
       int pass = sparse_permuted_slice(n, b, syms[t], dw);
       assert(pass);
       // assert() is compiled out under NDEBUG, so also record the outcome
       // for the process exit status
       if (!pass) all_pass = 0;
     }
   }

   MPI_Finalize();
   return all_pass ? 0 : 1;
 }

 #endif
sparse_permuted_slice
int sparse_permuted_slice(int n, int b, int sym, World &dw)
tests sparse remote global write via permute function
Definition: sparse_permuted_slice.cxx:18

ctf.hpp

CTF::Matrix
Matrix class which encapsulates a 2D tensor.
Definition: matrix.h:18

ctf.core.rank
def rank(self)
Definition: core.pyx:312

CTF::Tensor::permute
void permute(dtype beta, CTF_int::tensor &A, int *const *perms_A, dtype alpha)
Apply permutation to matrix, potentially extracting a slice B[i,j,...] = beta*B[...] + alpha*A[perms_A[0][i],perms_A[1][j],...].
Definition: tensor.cxx:429

ctf.core.b
b
Definition: core.pyx:386

NS
Definition: common.h:37

CTF::World
an instance of the CTF library (world) on a MPI communicator
Definition: world.h:19

ctf.core.string
string
Definition: core.pyx:456

CTF::Tensor::norm2
dtype norm2()
computes the Frobenius norm of the tensor (needs sqrt()!)
Definition: tensor.h:811

getCmdOption
char * getCmdOption(char **begin, char **end, const std::string &option)
Definition: sparse_permuted_slice.cxx:147

main
int main(int argc, char **argv)
Definition: sparse_permuted_slice.cxx:157

CTF::Tensor::get_local_data
void get_local_data(int64_t *npair, int64_t **global_idx, dtype **data, bool nonzeros_only=false, bool unpack_sym=false) const
Gives the global indices and values associated with the local data.
Definition: tensor.cxx:159

CTF
Definition: apsp.cxx:17

CTF::Tensor
an instance of a tensor within a CTF world
Definition: tensor.h:74

SY
Definition: common.h:37

AS
Definition: common.h:37

CTF::Tensor::write
void write(int64_t npair, int64_t const *global_idx, dtype const *data)
writes in values associated with any set of indices The sparse data is defined in coordinate format...
Definition: tensor.cxx:264

SH
Definition: common.h:37

ctf.core.np
def np(self)
Definition: core.pyx:315