// ctf/tensor_8cxx_source.html

 /*Copyright (c) 2011, Edgar Solomonik, all rights reserved.*/

 #include "../interface/common.h"
 #include "world.h"
 #include "idx_tensor.h"
 #include "../tensor/untyped_tensor.h"


 namespace CTF {

   /** \brief Default constructor: default-constructs the untyped CTF_int::tensor base and nothing more. */
   template<typename dtype>
   Tensor<dtype>::Tensor()
     : CTF_int::tensor()
   {
   }


   /**
    * \brief Constructor taking (order, len, sym, world, name, profile, sr).
    *
    * Every argument is handed to the CTF_int::tensor base constructor; sr and world
    * are passed by address and the sixth base argument is the literal 1.
    * The body only asserts that the element size of the stored algebraic structure
    * equals sizeof(dtype).
    */
   template<typename dtype>
   Tensor<dtype>::Tensor(int order, int const * len, int const * sym,
                         World & world,
                         char const * name, bool profile,
                         CTF_int::algstrct const & sr)
     : CTF_int::tensor(&sr, order, len, sym, &world, 1, name, profile)
   {
     // the typed view is only valid if elements are exactly sizeof(dtype) bytes
     IASSERT(this->sr->el_size==sizeof(dtype));
   }

   /**
    * \brief Constructor taking (order, len, sym, world, sr, name, profile).
    *
    * Forwards to the CTF_int::tensor base constructor with the same base arguments as
    * the overload whose algebraic structure is the last parameter; only the parameter
    * order seen by the caller differs. Asserts afterwards that the element size of the
    * stored algebraic structure equals sizeof(dtype).
    */
   template<typename dtype>
   Tensor<dtype>::Tensor(int order, int const * len, int const * sym,
                         World & world,
                         CTF_int::algstrct const & sr,
                         char const * name, bool profile)
     : CTF_int::tensor(&sr, order, len, sym, &world, 1, name, profile)
   {
     IASSERT(this->sr->el_size==sizeof(dtype));
   }


   /**
    * \brief Constructor taking an explicit sparsity flag and a symmetry array.
    *
    * Forwards to the CTF_int::tensor base constructor, appending is_sparse as the final
    * base argument (after profile). Asserts that the element size of the stored
    * algebraic structure equals sizeof(dtype).
    */
   template<typename dtype>
   Tensor<dtype>::Tensor(int order, bool is_sparse,
                         int const * len, int const * sym,
                         World & world,
                         CTF_int::algstrct const & sr,
                         char const * name, bool profile)
     : CTF_int::tensor(&sr, order, len, sym, &world, 1, name, profile, is_sparse)
   {
     IASSERT(this->sr->el_size==sizeof(dtype));
   }

   /**
    * \brief Constructor taking an explicit sparsity flag and no symmetry array.
    *
    * Forwards to the CTF_int::tensor base constructor with NULL in the symmetry
    * position and is_sparse as the final base argument. Asserts that the element size
    * of the stored algebraic structure equals sizeof(dtype).
    */
   template<typename dtype>
   Tensor<dtype>::Tensor(int order, bool is_sparse,
                         int const * len,
                         World & world,
                         CTF_int::algstrct const & sr,
                         char const * name, bool profile)
     : CTF_int::tensor(&sr, order, len, NULL, &world, 1, name, profile, is_sparse)
   {
     IASSERT(this->sr->el_size==sizeof(dtype));
   }


   /**
    * \brief Constructor taking (order, len, world, sr, name, profile) with no symmetry array.
    *
    * Forwards to the CTF_int::tensor base constructor with NULL in the symmetry
    * position. Asserts that the element size of the stored algebraic structure
    * equals sizeof(dtype).
    */
   template<typename dtype>
   Tensor<dtype>::Tensor(int order, int const * len,
                         World & world,
                         CTF_int::algstrct const & sr,
                         char const * name, bool profile)
     : CTF_int::tensor(&sr, order, len, NULL, &world, 1, name, profile)
   {
     IASSERT(this->sr->el_size==sizeof(dtype));
   }


   /**
    * \brief Constructor that additionally takes an index string and two Idx_Partition objects.
    *
    * Forwards to the CTF_int::tensor base constructor, passing idx, prl and blk through
    * unchanged and the literal 0 as the third base argument (the slot in which the
    * sibling overload with an is_sparse_ parameter passes that flag).
    * Asserts that the element size of the stored algebraic structure equals sizeof(dtype).
    */
   template<typename dtype>
   Tensor<dtype>::Tensor(int order, int const * len, int const * sym,
                         World & world,
                         char const * idx,
                         Idx_Partition const & prl,
                         Idx_Partition const & blk,
                         char const * name, bool profile,
                         CTF_int::algstrct const & sr_)
     : CTF_int::tensor(&sr_, order, 0, len, sym, &world, idx, prl, blk, name, profile)
   {
     IASSERT(this->sr->el_size==sizeof(dtype));
   }

   /**
    * \brief Constructor taking a sparsity flag, an index string and two Idx_Partition objects.
    *
    * Forwards to the CTF_int::tensor base constructor with is_sparse_ as the third base
    * argument and idx, prl and blk passed through unchanged.
    * Asserts that the element size of the stored algebraic structure equals sizeof(dtype).
    */
   template<typename dtype>
   Tensor<dtype>::Tensor(int order, bool is_sparse_,
                         int const * len, int const * sym,
                         World & world,
                         char const * idx,
                         Idx_Partition const & prl,
                         Idx_Partition const & blk,
                         char const * name, bool profile,
                         CTF_int::algstrct const & sr_)
     : CTF_int::tensor(&sr_, order, is_sparse_, len, sym, &world, idx, prl, blk, name, profile)
   {
     IASSERT(this->sr->el_size==sizeof(dtype));
   }


   /**
    * \brief Constructs from an untyped tensor A, forwarding the caller's copy flag.
    *
    * Delegates to the CTF_int::tensor(pointer, flag) base constructor with &A and copy.
    */
   template<typename dtype>
   Tensor<dtype>::Tensor(bool copy, tensor const & A)
     : CTF_int::tensor(&A, copy)
   {
   }

   /** \brief Copy constructor: delegates to the CTF_int::tensor(pointer, flag) base constructor with &A and true. */
   template<typename dtype>
   Tensor<dtype>::Tensor(Tensor<dtype> const & A)
     : CTF_int::tensor(&A, true)
   {
   }

   /** \brief Constructs from an untyped tensor: delegates to the CTF_int::tensor(pointer, flag) base constructor with &A and true. */
   template<typename dtype>
   Tensor<dtype>::Tensor(tensor const & A)
     : CTF_int::tensor(&A, true)
   {
   }

   /**
    * \brief Constructs a tensor on world_ using the attributes of A.
    *
    * Passes A's sr, order, lens, sym, name and profile members to the CTF_int::tensor
    * base constructor together with &world_. No element data of A is referenced here.
    */
   template<typename dtype>
   Tensor<dtype>::Tensor(tensor const & A, World & world_)
     : CTF_int::tensor(A.sr, A.order, A.lens, A.sym, &world_, 1, A.name, A.profile)
   {
   }

   /** \brief Constructs from tensor A and a symmetry array: delegates to the CTF_int::tensor(&A, new_sym) base constructor. */
   template<typename dtype>
   Tensor<dtype>::Tensor(tensor & A, int const * new_sym)
     : CTF_int::tensor(&A, new_sym)
   {
   }

   /**
    * \brief Builds an indexed view of this tensor labelled by idx_map_.
    * \param[in] idx_map_ index label string handed to the Typ_Idx_Tensor constructor
    * \return a Typ_Idx_Tensor constructed from (this, idx_map_)
    */
   template<typename dtype>
   Typ_Idx_Tensor<dtype> Tensor<dtype>::operator[](const char * idx_map_)
   {
     // no check is made here that the label count matches the tensor order
     Typ_Idx_Tensor<dtype> labelled(this, idx_map_);
     return labelled;
   }

   /**
    * \brief Named equivalent of operator[]: builds an indexed view of this tensor.
    * \param[in] idx_map_ index label string handed to the Typ_Idx_Tensor constructor
    * \return a Typ_Idx_Tensor constructed from (this, idx_map_)
    */
   template<typename dtype>
   Typ_Idx_Tensor<dtype> Tensor<dtype>::i(const char * idx_map_)
   {
     // no check is made here that the label count matches the tensor order
     Typ_Idx_Tensor<dtype> labelled(this, idx_map_);
     return labelled;
   }


   /** \brief Destructor: has an empty body; any cleanup is left to the base class destructor. */
   template<typename dtype>
   Tensor<dtype>::~Tensor()
   {
   }

   /**
    * \brief Typed wrapper around tensor::get_raw_data.
    * \param[out] size forwarded to the untyped call, which is expected to fill it in
    * \return the pointer written by the untyped call, viewed as dtype*
    */
   template<typename dtype>
   dtype * Tensor<dtype>::get_raw_data(int64_t * size) const {
     dtype * typed_ptr;
     // let the untyped routine write through a char** view of the typed pointer
     char ** untyped_slot = (char**)&typed_ptr;
     tensor::get_raw_data(untyped_slot, size);
     return typed_ptr;
   }

   /**
    * \brief Reads the locally held entries into separate key and value arrays.
    *
    * Calls CTF_int::tensor::read_local_nnz when nonzeros_only is set and
    * CTF_int::tensor::read_local otherwise, then splits the returned pair buffer.
    *
    * \param[out] npair         receives the number of pairs read
    * \param[out] global_idx    receives a CTF_int::alloc'd array of *npair keys
    * \param[out] data          receives an sr->alloc'd array of *npair values
    * \param[in]  nonzeros_only selects read_local_nnz over read_local
    * \param[in]  unpack_sym    forwarded to the underlying read call
    */
   template<typename dtype>
   void Tensor<dtype>::get_local_data(int64_t *  npair,
                                      int64_t ** global_idx,
                                      dtype **   data,
                                      bool       nonzeros_only,
                                      bool       unpack_sym) const {
     char * cpairs;
     int ret;
     if (nonzeros_only)
       ret = CTF_int::tensor::read_local_nnz(npair,&cpairs,unpack_sym);
     else
       ret = CTF_int::tensor::read_local(npair,&cpairs,unpack_sym);
     if (ret != CTF_int::SUCCESS){ printf("CTF ERROR: failed to execute function read_local\n"); IASSERT(0); return; }
     *global_idx = (int64_t*)CTF_int::alloc((*npair)*sizeof(int64_t));
     *data = (dtype*)sr->alloc((*npair));
     CTF_int::PairIterator pairs(sr, cpairs);
     // 64-bit counter: *npair is an int64_t, so an int index could overflow before reaching it
     for (int64_t i=0; i<(*npair); i++){
       (*global_idx)[i] = pairs[i].k();
       pairs[i].read_val((char*)((*data)+i));
     }
     if (cpairs != NULL) sr->pair_dealloc(cpairs);
   }

   /**
    * \brief Reads the locally held entries (via CTF_int::tensor::read_local) into
    *        separate key and value arrays.
    *
    * \param[out] npair      receives the number of pairs read
    * \param[out] global_idx receives a CTF_int::alloc'd array of *npair keys
    * \param[out] data       receives a CTF_int::alloc'd array of *npair values
    * \param[in]  unpack_sym forwarded to the underlying read call
    */
   template<typename dtype>
   void Tensor<dtype>::read_local(int64_t *  npair,
                                  int64_t ** global_idx,
                                  dtype **   data,
                                  bool       unpack_sym) const {
     char * cpairs;
     int ret;
     ret = CTF_int::tensor::read_local(npair,&cpairs,unpack_sym);
     if (ret != CTF_int::SUCCESS){ printf("CTF ERROR: failed to execute function read_local\n"); IASSERT(0); return; }
     *global_idx = (int64_t*)CTF_int::alloc((*npair)*sizeof(int64_t));
     *data = (dtype*)CTF_int::alloc((*npair)*sizeof(dtype));
     CTF_int::PairIterator pairs(sr, cpairs);
     // 64-bit counter: *npair is an int64_t, so an int index could overflow before reaching it
     for (int64_t i=0; i<(*npair); i++){
       (*global_idx)[i] = pairs[i].k();
       pairs[i].read_val((char*)((*data)+i));
     }
     if (cpairs != NULL) sr->pair_dealloc(cpairs);
   }

   /**
    * \brief Reads the locally held entries as an array of typed pairs.
    *
    * \param[out] npair         receives the number of pairs read
    * \param[out] pairs         receives the buffer produced by the untyped read, viewed as Pair<dtype>*
    * \param[in]  nonzeros_only selects CTF_int::tensor::read_local_nnz over read_local
    * \param[in]  unpack_sym    forwarded to the underlying read call
    */
   template<typename dtype>
   void Tensor<dtype>::get_local_pairs(int64_t *      npair,
                                       Pair<dtype> ** pairs,
                                       bool           nonzeros_only,
                                       bool           unpack_sym) const {
     char * raw_pairs;
     int const status = nonzeros_only
                      ? CTF_int::tensor::read_local_nnz(npair,&raw_pairs,unpack_sym)
                      : CTF_int::tensor::read_local(npair,&raw_pairs,unpack_sym);
     // the output pointer is assigned before the status is inspected, so it is written even on failure
     *pairs = (Pair<dtype>*)raw_pairs;
     if (status == CTF_int::SUCCESS) return;
     printf("CTF ERROR: failed to execute function read_local\n");
     IASSERT(0);
   }

   /**
    * \brief Reads the locally held entries (via CTF_int::tensor::read_local) as typed pairs.
    *
    * \param[out] npair      receives the number of pairs read
    * \param[out] pairs      receives the buffer produced by the untyped read, viewed as Pair<dtype>*
    * \param[in]  unpack_sym forwarded to the underlying read call
    */
   template<typename dtype>
   void Tensor<dtype>::read_local(int64_t *      npair,
                                  Pair<dtype> ** pairs,
                                  bool           unpack_sym) const {
     char * raw_pairs;
     int const status = CTF_int::tensor::read_local(npair, &raw_pairs, unpack_sym);
     // the output pointer is assigned before the status is inspected, so it is written even on failure
     *pairs = (Pair<dtype>*)raw_pairs;
     if (status == CTF_int::SUCCESS) return;
     printf("CTF ERROR: failed to execute function read_local\n");
     IASSERT(0);
   }

   /**
    * \brief Reads the values stored at the given global indices.
    *
    * Packs (global_idx[i], data[i]) into a temporary pair buffer, calls
    * CTF_int::tensor::read on it and copies the resulting values back into data.
    *
    * \param[in]     npair      number of entries in global_idx and data
    * \param[in]     global_idx keys to read
    * \param[in,out] data       seeds the pair values on entry; overwritten with the values read
    */
   template<typename dtype>
   void Tensor<dtype>::read(int64_t         npair,
                            int64_t const * global_idx,
                            dtype *         data){
     int ret;
     int64_t i;
     char * cpairs = sr->pair_alloc(npair);
     Pair< dtype > * pairs =(Pair< dtype >*)cpairs;
     for (i=0; i<npair; i++){
       pairs[i].k = global_idx[i];
       pairs[i].d = data[i];
     }
     ret = CTF_int::tensor::read(npair, cpairs);
     if (ret != CTF_int::SUCCESS){
       printf("CTF ERROR: failed to execute function read\n");
       // free the staging buffer on the failure path too; data is left untouched
       sr->pair_dealloc(cpairs);
       IASSERT(0);
       return;
     }
     for (i=0; i<npair; i++){
       data[i] = pairs[i].d;
     }
     sr->pair_dealloc(cpairs);
   }

   /**
    * \brief Reads values for the keys in pairs, operating directly on the caller's buffer.
    *
    * The pair array is reinterpreted as a char buffer and handed to
    * CTF_int::tensor::read; no staging copy is made.
    *
    * \param[in]     npair number of pairs
    * \param[in,out] pairs buffer passed to the untyped read
    */
   template<typename dtype>
   void Tensor<dtype>::read(int64_t       npair,
                            Pair<dtype> * pairs){
     //FIXME raises mem consumption
     char * raw_pairs = (char*)pairs;
     int const status = CTF_int::tensor::read(npair, raw_pairs);
     // the buffer handed down must still be the caller's own buffer
     IASSERT(raw_pairs == (char*)pairs);
     if (status == CTF_int::SUCCESS) return;
     printf("CTF ERROR: failed to execute function read\n");
     IASSERT(0);
   }

   /**
    * \brief Writes the given values at the given global indices.
    *
    * Packs (global_idx[i], data[i]) into a temporary pair buffer and calls
    * CTF_int::tensor::write with sr->mulid() and sr->addid() as the two scaling arguments.
    *
    * \param[in] npair      number of entries in global_idx and data
    * \param[in] global_idx keys to write
    * \param[in] data       values to write
    */
   template<typename dtype>
   void Tensor<dtype>::write(int64_t         npair,
                             int64_t const * global_idx,
                             dtype const *   data) {
     int ret;
     char * cpairs = sr->pair_alloc(npair);
     Pair< dtype > * pairs =(Pair< dtype >*)cpairs;
     // 64-bit counter: npair is an int64_t, so an int index could overflow before reaching it
     for (int64_t i=0; i<npair; i++){
       pairs[i].k = global_idx[i];
       pairs[i].d = data[i];
     }
     ret = CTF_int::tensor::write(npair, sr->mulid(), sr->addid(), cpairs);
     if (ret != CTF_int::SUCCESS){
       printf("CTF ERROR: failed to execute function write\n");
       // free the staging buffer on the failure path too
       sr->pair_dealloc(cpairs);
       IASSERT(0);
       return;
     }
     sr->pair_dealloc(cpairs);
   }

   /**
    * \brief Writes the given pairs, handing the caller's buffer straight to the untyped write.
    *
    * Calls CTF_int::tensor::write with sr->mulid() and sr->addid() as the two scaling
    * arguments; the const qualifier on the pair buffer is cast away for that call.
    *
    * \param[in] npair number of pairs
    * \param[in] pairs pairs to write
    */
   template<typename dtype>
   void Tensor<dtype>::write(int64_t             npair,
                             Pair<dtype> const * pairs) {
     //FIXME raises mem consumption
     char const * raw_pairs = (char const*)pairs;
     int const status = CTF_int::tensor::write(npair, sr->mulid(), sr->addid(), (char*)raw_pairs);
     if (status == CTF_int::SUCCESS) return;
     printf("CTF ERROR: failed to execute function write\n");
     IASSERT(0);
   }

   /**
    * \brief Writes the given values at the given global indices with caller-supplied scaling.
    *
    * Packs (global_idx[i], data[i]) into a temporary pair buffer and calls
    * CTF_int::tensor::write with the addresses of alpha and beta.
    *
    * \param[in] npair      number of entries in global_idx and data
    * \param[in] alpha      first scaling argument forwarded to the untyped write
    * \param[in] beta       second scaling argument forwarded to the untyped write
    * \param[in] global_idx keys to write
    * \param[in] data       values to write
    */
   template<typename dtype>
   void Tensor<dtype>::write(int64_t         npair,
                             dtype           alpha,
                             dtype           beta,
                             int64_t const * global_idx,
                             dtype const *   data) {
     int ret;
     char * cpairs = sr->pair_alloc(npair);
     Pair< dtype > * pairs =(Pair< dtype >*)cpairs;

     // 64-bit counter: npair is an int64_t, so an int index could overflow before reaching it
     for (int64_t i=0; i<npair; i++){
       pairs[i].k = global_idx[i];
       pairs[i].d = data[i];
     }

     ret = CTF_int::tensor::write(npair, (char*)&alpha, (char*)&beta, cpairs);
     if (ret != CTF_int::SUCCESS){
       printf("CTF ERROR: failed to execute function write\n");
       // free the staging buffer on the failure path too
       sr->pair_dealloc(cpairs);
       IASSERT(0);
       return;
     }
     sr->pair_dealloc(cpairs);
   }

   /**
    * \brief Writes the given pairs with caller-supplied scaling, without a staging copy.
    *
    * Calls CTF_int::tensor::write with the addresses of alpha and beta; the const
    * qualifier on the pair buffer is cast away for that call.
    *
    * \param[in] npair number of pairs
    * \param[in] alpha first scaling argument forwarded to the untyped write
    * \param[in] beta  second scaling argument forwarded to the untyped write
    * \param[in] pairs pairs to write
    */
   template<typename dtype>
   void Tensor<dtype>::write(int64_t             npair,
                             dtype               alpha,
                             dtype               beta,
                             Pair<dtype> const * pairs) {
     char const * raw_pairs = (char const*)pairs;
     char * alpha_bytes = (char*)&alpha;
     char * beta_bytes  = (char*)&beta;

     int const status = CTF_int::tensor::write(npair, alpha_bytes, beta_bytes, (char*)raw_pairs);
     if (status == CTF_int::SUCCESS) return;
     printf("CTF ERROR: failed to execute function write\n");
     IASSERT(0);
   }

   /**
    * \brief Reads the values stored at the given global indices with caller-supplied scaling.
    *
    * Packs (global_idx[i], data[i]) into a temporary pair buffer, calls
    * CTF_int::tensor::read with the addresses of alpha and beta, and copies the
    * resulting values back into data.
    *
    * \param[in]     npair      number of entries in global_idx and data
    * \param[in]     alpha      first scaling argument forwarded to the untyped read
    * \param[in]     beta       second scaling argument forwarded to the untyped read
    * \param[in]     global_idx keys to read
    * \param[in,out] data       seeds the pair values on entry; overwritten with the values read
    */
   template<typename dtype>
   void Tensor<dtype>::read(int64_t         npair,
                            dtype           alpha,
                            dtype           beta,
                            int64_t const * global_idx,
                            dtype *         data){
     int ret;
     // 64-bit counter: npair is an int64_t, so an int index could overflow before reaching it
     int64_t i;
     char * cpairs = sr->pair_alloc(npair);
     Pair< dtype > * pairs =(Pair< dtype >*)cpairs;
     for (i=0; i<npair; i++){
       pairs[i].k = global_idx[i];
       pairs[i].d = data[i];
     }
     ret = CTF_int::tensor::read(npair, (char*)&alpha, (char*)&beta, cpairs);
     if (ret != CTF_int::SUCCESS){
       printf("CTF ERROR: failed to execute function read\n");
       // free the staging buffer on the failure path too; data is left untouched
       sr->pair_dealloc(cpairs);
       IASSERT(0);
       return;
     }
     for (i=0; i<npair; i++){
       data[i] = pairs[i].d;
     }
     sr->pair_dealloc(cpairs);
   }

   /**
    * \brief Reads values for the keys in pairs with caller-supplied scaling, in place.
    *
    * The pair array is reinterpreted as a char buffer and handed to
    * CTF_int::tensor::read together with the addresses of alpha and beta.
    *
    * \param[in]     npair number of pairs
    * \param[in]     alpha first scaling argument forwarded to the untyped read
    * \param[in]     beta  second scaling argument forwarded to the untyped read
    * \param[in,out] pairs buffer passed to the untyped read
    */
   template<typename dtype>
   void Tensor<dtype>::read(int64_t       npair,
                            dtype         alpha,
                            dtype         beta,
                            Pair<dtype> * pairs){
     char * raw_pairs = (char*)pairs;
     char * alpha_bytes = (char*)&alpha;
     char * beta_bytes  = (char*)&beta;
     int const status = CTF_int::tensor::read(npair, alpha_bytes, beta_bytes, raw_pairs);
     // the buffer handed down must still be the caller's own buffer
     IASSERT(raw_pairs == (char*)pairs);
     if (status == CTF_int::SUCCESS) return;
     printf("CTF ERROR: failed to execute function read\n");
     IASSERT(0);
   }


   /**
    * \brief Typed wrapper around CTF_int::tensor::allread that returns its buffer through vals.
    *
    * \param[out] npair  forwarded to allread
    * \param[out] vals   forwarded to allread as a char** output slot
    * \param[in]  unpack forwarded to allread
    */
   template<typename dtype>
   void Tensor<dtype>::read_all(int64_t * npair, dtype ** vals, bool unpack){
     char ** untyped_vals = (char**)vals;
     int const status = CTF_int::tensor::allread(npair, untyped_vals, unpack);
     if (status == CTF_int::SUCCESS) return;
     printf("CTF ERROR: failed to execute function read_all\n");
     IASSERT(0);
   }

   /**
    * \brief Typed wrapper around CTF_int::tensor::allread that fills a caller-provided buffer.
    *
    * \param[out] vals   buffer forwarded to allread as char*
    * \param[in]  unpack forwarded to allread
    * \return the pair count reported by allread; 0 if allread fails without writing it
    */
   template<typename dtype>
   int64_t Tensor<dtype>::read_all(dtype * vals, bool unpack){
     int ret;
     // start from a defined value so the failure path never returns an indeterminate count
     int64_t npair = 0;
     ret = CTF_int::tensor::allread(&npair, (char*)vals, unpack);
     if (ret != CTF_int::SUCCESS){ printf("CTF ERROR: failed to execute function read_all\n"); IASSERT(0); }
     return npair;
   }
   /** \brief Forwards name_ to CTF_int::tensor::set_name of the untyped base. */
   template<typename dtype>
   void Tensor<dtype>::set_name(char const * name_)
   {
     this->CTF_int::tensor::set_name(name_);
   }

   /** \brief Forwards to CTF_int::tensor::profile_on of the untyped base. */
   template<typename dtype>
   void Tensor<dtype>::profile_on()
   {
     this->CTF_int::tensor::profile_on();
   }

   /** \brief Forwards to CTF_int::tensor::profile_off of the untyped base. */
   template<typename dtype>
   void Tensor<dtype>::profile_off()
   {
     this->CTF_int::tensor::profile_off();
   }

   /**
    * \brief Prints the tensor via CTF_int::tensor::print, passing a cutoff value.
    * \param[in] fp     stream forwarded to the untyped print
    * \param[in] cutoff passed to the untyped print by address, as raw bytes
    */
   template<typename dtype>
   void Tensor<dtype>::print(FILE* fp, dtype cutoff) const{
     char * cutoff_bytes = (char *)&cutoff;
     CTF_int::tensor::print(fp, cutoff_bytes);
   }

   /**
    * \brief Prints the tensor via CTF_int::tensor::print with a NULL cutoff argument.
    * \param[in] fp stream forwarded to the untyped print
    */
   template<typename dtype>
   void Tensor<dtype>::print(FILE* fp) const
   {
     this->CTF_int::tensor::print(fp, NULL);
   }

   /** \brief Prints the tensor to stdout via CTF_int::tensor::print with a NULL cutoff argument. */
   template<typename dtype>
   void Tensor<dtype>::prnt() const
   {
     this->CTF_int::tensor::print(stdout, NULL);
   }


   /**
    * \brief Compares this tensor with A via CTF_int::tensor::compare.
    * \param[in] A      tensor passed (by address) to the untyped compare
    * \param[in] fp     stream forwarded to the untyped compare
    * \param[in] cutoff passed by address as the raw bytes of a double
    *                   (NOTE(review): not converted to dtype first - confirm the untyped routine expects a double)
    */
   template<typename dtype>
   void Tensor<dtype>::compare(const Tensor<dtype>& A, FILE* fp, double cutoff){
     char const * cutoff_bytes = (char const *)&cutoff;
     CTF_int::tensor::compare(&A, fp, cutoff_bytes);
   }

   /**
    * \brief Permuted accumulation from A using permutation arrays for A.
    *
    * Calls CTF_int::tensor::permute(&A, perms_A, &alpha, NULL, &beta); the NULL sits in
    * the slot where the sibling overload passes perms_B.
    *
    * \param[in] beta    scaling value passed by address as the last untyped argument
    * \param[in] A       source tensor
    * \param[in] perms_A permutation arrays forwarded as the second untyped argument
    * \param[in] alpha   scaling value passed by address as the third untyped argument
    */
   template<typename dtype>
   void Tensor<dtype>::permute(dtype             beta,
                               CTF_int::tensor & A,
                               int * const *     perms_A,
                               dtype             alpha){
     int ret = CTF_int::tensor::permute(&A, perms_A, (char*)&alpha,
                                        NULL, (char*)&beta);
     // name the failing function in the message, matching the other wrappers in this file
     if (ret != CTF_int::SUCCESS){ printf("CTF ERROR: failed to execute function permute\n"); IASSERT(0); return; }
   }

   /**
    * \brief Permuted accumulation from A using permutation arrays for this tensor.
    *
    * Calls CTF_int::tensor::permute(&A, NULL, &alpha, perms_B, &beta).
    *
    * \param[in] perms_B permutation arrays forwarded as the fourth untyped argument
    * \param[in] beta    scaling value passed by address as the last untyped argument
    * \param[in] A       source tensor
    * \param[in] alpha   scaling value passed by address as the third untyped argument
    */
   template<typename dtype>
   void Tensor<dtype>::permute(int * const *     perms_B,
                               dtype             beta,
                               CTF_int::tensor & A,
                               dtype             alpha){
     char * alpha_bytes = (char*)&alpha;
     char * beta_bytes  = (char*)&beta;
     int const status = CTF_int::tensor::permute(&A, NULL, alpha_bytes, perms_B, beta_bytes);
     if (status == CTF_int::SUCCESS) return;
     printf("CTF ERROR: failed to execute function permute\n");
     IASSERT(0);
   }

   /** \brief Calls the argument-less CTF_int::tensor::sparsify and reports a failure status. */
   template<typename dtype>
   void Tensor<dtype>::sparsify(){
     int const status = CTF_int::tensor::sparsify();
     if (status == CTF_int::SUCCESS) return;
     printf("CTF ERROR: failed to execute function sparsify\n");
     IASSERT(0);
   }

   /**
    * \brief Calls CTF_int::tensor::sparsify with a threshold and reports a failure status.
    * \param[in] threshold passed to the untyped routine by address, as raw bytes
    * \param[in] take_abs  forwarded unchanged to the untyped routine
    */
   template<typename dtype>
   void Tensor<dtype>::sparsify(dtype threshold, bool take_abs){
     char * threshold_bytes = (char*)&threshold;
     int const status = CTF_int::tensor::sparsify(threshold_bytes, take_abs);
     if (status == CTF_int::SUCCESS) return;
     printf("CTF ERROR: failed to execute function sparsify\n");
     IASSERT(0);
   }

   /**
    * \brief Calls CTF_int::tensor::sparsify with a user-supplied predicate.
    *
    * The typed predicate is wrapped in a lambda that reinterprets the untyped element
    * pointer as dtype and passes the element by value to filter.
    *
    * \param[in] filter predicate evaluated on individual elements
    */
   template<typename dtype>
   void Tensor<dtype>::sparsify(std::function<bool(dtype)> filter){
     int ret = CTF_int::tensor::sparsify([&](char const * c){ return filter(((dtype*)c)[0]); });
     // message previously misspelled the function name as "sparisfy"
     if (ret != CTF_int::SUCCESS){ printf("CTF ERROR: failed to execute function sparsify\n"); IASSERT(0); return; }
   }

   template <typename dtype>
   void read_sparse_from_file_base(const char * fpath, bool with_vals, Tensor<dtype> * T){
     char ** datastr;
     int64_t my_nvals = CTF_int::read_data_mpiio<dtype>(T->wrld, fpath, &datastr);

     Pair<dtype> * pairs = (Pair<dtype>*)T->sr->pair_alloc(my_nvals);

     CTF_int::parse_sparse_tensor_data<dtype>(datastr, T->order, (dtype*)T->sr->mulid(), T->lens, my_nvals, pairs, with_vals);

     //strtok contains pointers to char array generated from file
     if (datastr[0] != NULL) CTF_int::cdealloc(datastr[0]);
     CTF_int::cdealloc(datastr);

     T->write(my_nvals,pairs);

     T->sr->pair_dealloc((char*)pairs);
   }

   // Explicit specializations of read_sparse_from_file for int, double, float and
   // int64_t. Each one hands its arguments and `this` to read_sparse_from_file_base;
   // the element type is deduced from the type of `this`.

   /** \brief int specialization: delegates to read_sparse_from_file_base. */
   template<>
   inline void Tensor<int>::read_sparse_from_file(const char * fpath, bool with_vals)
   {
     read_sparse_from_file_base(fpath, with_vals, this);
   }

   /** \brief double specialization: delegates to read_sparse_from_file_base. */
   template<>
   inline void Tensor<double>::read_sparse_from_file(const char * fpath, bool with_vals)
   {
     read_sparse_from_file_base(fpath, with_vals, this);
   }

   /** \brief float specialization: delegates to read_sparse_from_file_base. */
   template<>
   inline void Tensor<float>::read_sparse_from_file(const char * fpath, bool with_vals)
   {
     read_sparse_from_file_base(fpath, with_vals, this);
   }

   /** \brief int64_t specialization: delegates to read_sparse_from_file_base. */
   template<>
   inline void Tensor<int64_t>::read_sparse_from_file(const char * fpath, bool with_vals)
   {
     read_sparse_from_file_base(fpath, with_vals, this);
   }


   template <typename dtype>
   void write_sparse_to_file_base(const char * fpath, bool with_vals, Tensor<dtype> * T){
     int64_t my_nvals;

     Pair<dtype> * pairs;
     T->get_local_pairs(&my_nvals, &pairs, true);
     int64_t str_len;
     char * datastr = CTF_int::serialize_sparse_tensor_data<dtype>(T->order, T->lens, my_nvals, pairs, with_vals, str_len);
     CTF_int::write_data_mpiio<dtype>(T->wrld, fpath, datastr, str_len);
     CTF_int::cdealloc(datastr);
     T->sr->pair_dealloc((char*)pairs);
   }

   // Explicit specializations of write_sparse_to_file for int, double, float and
   // int64_t. Each one hands its arguments and `this` to write_sparse_to_file_base;
   // the element type is deduced from the type of `this`.

   /** \brief int specialization: delegates to write_sparse_to_file_base. */
   template<>
   inline void Tensor<int>::write_sparse_to_file(const char * fpath, bool with_vals)
   {
     write_sparse_to_file_base(fpath, with_vals, this);
   }

   /** \brief double specialization: delegates to write_sparse_to_file_base. */
   template<>
   inline void Tensor<double>::write_sparse_to_file(const char * fpath, bool with_vals)
   {
     write_sparse_to_file_base(fpath, with_vals, this);
   }

   /** \brief float specialization: delegates to write_sparse_to_file_base. */
   template<>
   inline void Tensor<float>::write_sparse_to_file(const char * fpath, bool with_vals)
   {
     write_sparse_to_file_base(fpath, with_vals, this);
   }

   /** \brief int64_t specialization: delegates to write_sparse_to_file_base. */
   template<>
   inline void Tensor<int64_t>::write_sparse_to_file(const char * fpath, bool with_vals)
   {
     write_sparse_to_file_base(fpath, with_vals, this);
   }


   /**
    * \brief Typed wrapper around CTF_int::tensor::add_to_subworld.
    *
    * When tsr is NULL a default-constructed placeholder tensor carrying a clone of this
    * tensor's algebraic structure is passed instead, and the clone is deleted afterwards.
    *
    * \param[in,out] tsr   tensor passed to the untyped routine, or NULL
    * \param[in]     alpha passed to the untyped routine by address
    * \param[in]     beta  passed to the untyped routine by address
    */
   template<typename dtype>
   void Tensor<dtype>::add_to_subworld(
                                      Tensor<dtype> * tsr,
                                      dtype                   alpha,
                                      dtype                   beta){
     if (tsr != NULL){
       CTF_int::tensor::add_to_subworld(tsr, (char*)&alpha, (char*)&beta);
       return;
     }
     // no tensor supplied: stand in with an empty tensor that only has an algebraic structure
     tensor placeholder = tensor();
     placeholder.sr = sr->clone();
     CTF_int::tensor::add_to_subworld(&placeholder, (char*)&alpha, (char*)&beta);
     delete placeholder.sr;
   }

   /**
    * \brief add_to_subworld using sr->mulid() for both scaling arguments.
    *
    * The identities are handed to CTF_int::tensor::add_to_subworld as untyped pointers,
    * the same way add_from_subworld(tsr) does in this file. The previous body passed the
    * `char const *` returned by mulid() where the typed overload expects dtype values.
    * When tsr is NULL a default-constructed placeholder tensor carrying a clone of this
    * tensor's algebraic structure is passed instead, and the clone is deleted afterwards.
    *
    * \param[in,out] tsr tensor passed to the untyped routine, or NULL
    */
   template<typename dtype>
   void Tensor<dtype>::add_to_subworld(
                            Tensor<dtype> * tsr){
     // cast mirrors the (char*) casts used for alpha/beta in the typed overload
     char * ident = (char*)sr->mulid();
     if (tsr == NULL){
       tensor t = tensor();
       t.sr = sr->clone();
       CTF_int::tensor::add_to_subworld(&t, ident, ident);
       delete t.sr;
     } else
       CTF_int::tensor::add_to_subworld(tsr, ident, ident);
   }

   /**
    * \brief Typed wrapper around CTF_int::tensor::add_from_subworld.
    *
    * When tsr is NULL a default-constructed placeholder tensor carrying a clone of this
    * tensor's algebraic structure is passed instead, and the clone is deleted afterwards.
    *
    * \param[in] tsr   tensor passed to the untyped routine, or NULL
    * \param[in] alpha passed to the untyped routine by address
    * \param[in] beta  passed to the untyped routine by address
    */
   template<typename dtype>
   void Tensor<dtype>::add_from_subworld(
                                  Tensor<dtype> * tsr,
                                  dtype                   alpha,
                                  dtype                   beta){
     if (tsr != NULL){
       CTF_int::tensor::add_from_subworld(tsr, (char*)&alpha, (char*)&beta);
       return;
     }
     // no tensor supplied: stand in with an empty tensor that only has an algebraic structure
     tensor placeholder = tensor();
     placeholder.sr = sr->clone();
     CTF_int::tensor::add_from_subworld(&placeholder, (char*)&alpha, (char*)&beta);
     delete placeholder.sr;
   }

   /**
    * \brief add_from_subworld using sr->mulid() for both scaling arguments.
    *
    * When tsr is NULL a default-constructed placeholder tensor carrying a clone of this
    * tensor's algebraic structure is passed instead, and the clone is deleted afterwards.
    *
    * \param[in] tsr tensor passed to the untyped routine, or NULL
    */
   template<typename dtype>
   void Tensor<dtype>::add_from_subworld(
                            Tensor<dtype> * tsr){
     if (tsr != NULL){
       CTF_int::tensor::add_from_subworld(tsr, sr->mulid(), sr->mulid());
       return;
     }
     // no tensor supplied: stand in with an empty tensor that only has an algebraic structure
     tensor placeholder = tensor();
     placeholder.sr = sr->clone();
     CTF_int::tensor::add_from_subworld(&placeholder, sr->mulid(), sr->mulid());
     delete placeholder.sr;
   }

   /**
    * \brief Typed wrapper around CTF_int::tensor::slice using per-dimension offsets and ends.
    *
    * If A's communicator differs from this tensor's, the two communicator sizes are
    * compared first; equal sizes are reported as an error and the call returns without
    * slicing. In every other case the untyped slice is invoked with identical arguments.
    *
    * \param[in] offsets   forwarded to the untyped slice (first argument)
    * \param[in] ends      forwarded to the untyped slice (second argument)
    * \param[in] beta      passed by address to the untyped slice
    * \param[in] A         other tensor; its constness is cast away for the untyped call
    * \param[in] offsets_A forwarded to the untyped slice
    * \param[in] ends_A    forwarded to the untyped slice
    * \param[in] alpha     passed by address to the untyped slice
    */
   template<typename dtype>
   void Tensor<dtype>::slice(int const *             offsets,
                             int const *             ends,
                             dtype                   beta,
                             CTF_int::tensor const & A,
                             int const *             offsets_A,
                             int const *             ends_A,
                             dtype                   alpha){
     if (A.wrld->comm != wrld->comm){
       int nproc_other, nproc_self;
       MPI_Comm_size(A.wrld->comm, &nproc_other);
       MPI_Comm_size(wrld->comm,   &nproc_self);
       if (nproc_other == nproc_self){
         printf("CTF ERROR: number of processors should not match in slice if worlds are different\n");
         IASSERT(0);
         return;
       }
       //FIXME: was reversed?
     }
     // same call whether or not the worlds differ
     CTF_int::tensor::slice(
         offsets, ends, (char*)&beta, (Tensor *)&A,
         offsets_A, ends_A, (char*)&alpha);
   }

   /**
    * \brief Typed wrapper around CTF_int::tensor::slice using linearized corner indices.
    *
    * Each corner is expanded into a per-dimension array with CTF_int::cvrt_idx (using
    * this tensor's order/lens for corner_off/corner_end and A's for the _A corners).
    * Every entry of the two "end" arrays is then incremented by one before the untyped
    * slice is called, and the four temporary arrays are released afterwards.
    *
    * \param[in] corner_off   linearized first corner in this tensor
    * \param[in] corner_end   linearized last corner in this tensor
    * \param[in] beta         passed by address to the untyped slice
    * \param[in] A            other tensor; its constness is cast away for the untyped call
    * \param[in] corner_off_A linearized first corner in A
    * \param[in] corner_end_A linearized last corner in A
    * \param[in] alpha        passed by address to the untyped slice
    */
   template<typename dtype>
   void Tensor<dtype>::slice(int64_t                 corner_off,
                             int64_t                 corner_end,
                             dtype                   beta,
                             CTF_int::tensor const & A,
                             int64_t                 corner_off_A,
                             int64_t                 corner_end_A,
                             dtype                   alpha){
     int * begin_self;
     int * end_self;
     int * begin_other;
     int * end_other;

     CTF_int::cvrt_idx(this->order, this->lens, corner_off, &begin_self);
     CTF_int::cvrt_idx(this->order, this->lens, corner_end, &end_self);
     for (int d=0; d<order; d++){
       end_self[d] += 1;
     }
     CTF_int::cvrt_idx(A.order, A.lens, corner_off_A, &begin_other);
     CTF_int::cvrt_idx(A.order, A.lens, corner_end_A, &end_other);
     for (int d=0; d<A.order; d++){
       end_other[d] += 1;
     }

     CTF_int::tensor::slice(begin_self, end_self, (char*)&beta, (Tensor *)&A, begin_other, end_other, (char*)&alpha);

     CTF_int::cdealloc(begin_self);
     CTF_int::cdealloc(end_self);
     CTF_int::cdealloc(begin_other);
     CTF_int::cdealloc(end_other);
   }

   /**
    * \brief Returns a slice as a new tensor living on this tensor's own world.
    * \param[in] offsets forwarded to the three-argument slice overload
    * \param[in] ends    forwarded to the three-argument slice overload
    * \return the tensor produced by slice(offsets, ends, wrld)
    */
   template<typename dtype>
   Tensor<dtype> Tensor<dtype>::slice(int const * offsets,
                                      int const * ends) const
   {
     return slice(offsets, ends, wrld);
   }

   /**
    * \brief Returns a corner-indexed slice as a new tensor living on this tensor's own world.
    * \param[in] corner_off forwarded to the three-argument slice overload
    * \param[in] corner_end forwarded to the three-argument slice overload
    * \return the tensor produced by slice(corner_off, corner_end, wrld)
    */
   template<typename dtype>
   Tensor<dtype> Tensor<dtype>::slice(int64_t corner_off,
                                      int64_t corner_end) const
   {
     return slice(corner_off, corner_end, wrld);
   }

   /**
    * \brief Extracts the block [offsets, ends) of this tensor into a new tensor on owrld.
    *
    * For each dimension the range must satisfy 0 <= offsets[i] < ends[i] <= lens[i].
    * A dimension whose sym entry is not NS keeps that symmetry only when it and the next
    * dimension use identical offsets and ends; otherwise the new dimension is NS, and
    * ends[i+1] < offsets[i] is rejected as violating the tensor symmetry.
    * The new tensor is filled through the in-place slice overload, with sr->addid() as
    * beta and sr->mulid() as alpha.
    *
    * \param[in] offsets per-dimension start indices
    * \param[in] ends    per-dimension end indices (exclusive, per the length computation)
    * \param[in] owrld   world on which the new tensor is created
    * \return the new tensor, or a default-constructed Tensor after an error is reported
    */
   template<typename dtype>
   Tensor<dtype> Tensor<dtype>::slice(int const *  offsets,
                                      int const *  ends,
                                      World *      owrld) const {
     int i;
     int * new_lens = (int*)CTF_int::alloc(sizeof(int)*order);
     int * new_sym = (int*)CTF_int::alloc(sizeof(int)*order);
     for (i=0; i<order; i++){
       if (!(ends[i] - offsets[i] > 0 &&
                   offsets[i] >= 0 &&
                   ends[i] <= lens[i])){
         printf("CTF ERROR: invalid slice dimensions\n");
         IASSERT(0);
         // release the scratch arrays before the early return
         CTF_int::cdealloc(new_lens);
         CTF_int::cdealloc(new_sym);
         return Tensor<dtype>();
       }
       if (sym[i] != NS){
         if (offsets[i] == offsets[i+1] && ends[i] == ends[i+1]){
           new_sym[i] = sym[i];
         } else {
           if (!(ends[i+1] >= offsets[i])){
             printf("CTF ERROR: slice dimensions don't respect tensor symmetry\n");
             IASSERT(0);
             // release the scratch arrays before the early return
             CTF_int::cdealloc(new_lens);
             CTF_int::cdealloc(new_sym);
             return Tensor<dtype>();
           }
           new_sym[i] = NS;
         }
       } else new_sym[i] = NS;
       new_lens[i] = ends[i] - offsets[i];
     }
     //FIXME: could discard sr qualifiers
     Tensor<dtype> new_tsr(order, new_lens, new_sym, *owrld, *sr);
     // new_sym is reused as an all-zero offsets array for the destination tensor
     std::fill(new_sym, new_sym+order, 0);
     new_tsr.slice(new_sym, new_lens, *(dtype*)sr->addid(), *this, offsets, ends, *(dtype*)sr->mulid());
     CTF_int::cdealloc(new_lens);
     CTF_int::cdealloc(new_sym);
     return new_tsr;
   }

   /**
    * \brief Extracts a slice given by linearized corner indices into a new tensor on owrld.
    *
    * Both corners are expanded into per-dimension arrays with CTF_int::cvrt_idx, every
    * entry of the end array is incremented by one, and the array-based slice overload
    * does the work. The temporary arrays are released before returning.
    *
    * \param[in] corner_off linearized first corner
    * \param[in] corner_end linearized last corner
    * \param[in] owrld      world on which the new tensor is created
    * \return the tensor produced by the array-based slice overload
    */
   template<typename dtype>
   Tensor<dtype> Tensor<dtype>::slice(int64_t  corner_off,
                                      int64_t  corner_end,
                                      World *  owrld) const {
     int * begin_idx;
     int * end_idx;

     CTF_int::cvrt_idx(this->order, this->lens, corner_off, &begin_idx);
     CTF_int::cvrt_idx(this->order, this->lens, corner_end, &end_idx);
     for (int d=0; d<order; d++){
       end_idx[d] += 1;
     }

     Tensor<dtype> result = slice(begin_idx, end_idx, owrld);

     CTF_int::cdealloc(begin_idx);
     CTF_int::cdealloc(end_idx);

     return result;
   }

   /**
    * \brief Typed wrapper around CTF_int::tensor::align.
    *
    * Refuses (with an error message) when A's world and this tensor's world carry
    * different cdt.cm communicators; otherwise calls the untyped align and reports a
    * failure status.
    *
    * \param[in] A tensor passed (by address) to the untyped align
    */
   template<typename dtype>
   void Tensor<dtype>::align(const CTF_int::tensor & A){
     bool const same_instance = (A.wrld->cdt.cm == wrld->cdt.cm);
     if (!same_instance){
       printf("CTF ERROR: cannot align tensors on different CTF instances\n");
       IASSERT(0);
       return;
     }
     int const status = CTF_int::tensor::align(&A);
     if (status == CTF_int::SUCCESS) return;
     printf("CTF ERROR: failed to execute function align\n");
     IASSERT(0);
   }

   /**
    * \brief Reduces all tensor elements to a single value according to op.
    *
    * Dispatch, as implemented below:
    *  - OP_SUM:    reduce_sum with a Semiring<dtype,1> or Semiring<dtype,0>, chosen by sr->is_ordered()
    *  - OP_SUMABS: reduce_sumabs with a Ring<dtype,1> or Ring<dtype,0>, chosen by sr->is_ordered()
    *  - OP_SUMSQ:  reduce_sumsq with no explicit algebraic structure
    *  - OP_MAX / OP_MIN:       reduce_sum over a Monoid built from sr->min()/sr->max() and
    *                           CTF_int::default_max / CTF_int::default_min
    *  - OP_MAXABS / OP_MINABS: reduce_sumabs over the same Monoids
    * Any other op value is reported as an error instead of reading an unset status.
    *
    * \param[in] op reduction selector
    * \return the reduced value; a value-initialized dtype if op is not recognised
    */
   template<typename dtype>
   dtype Tensor<dtype>::reduce(OP op){
     int ret;
     dtype ans;
     switch (op) {
       case OP_SUM:
         if (sr->is_ordered()){
           Semiring<dtype,1> r = Semiring<dtype,1>();
           ret = reduce_sum((char*)&ans, &r);
         } else {
           Semiring<dtype,0> r = Semiring<dtype,0>();
           ret = reduce_sum((char*)&ans, &r);
         }
         break;
       case OP_SUMABS:
         if (sr->is_ordered()){
           Ring<dtype,1> r = Ring<dtype,1>();
           ret = reduce_sumabs((char*)&ans, &r);
         } else {
           Ring<dtype,0> r = Ring<dtype,0>();
           ret = reduce_sumabs((char*)&ans, &r);
         }
         break;
       case OP_SUMSQ:
         ret = reduce_sumsq((char*)&ans);
         break;
       case OP_MAX:
         {
           // the max-monoid is seeded with the value written by sr->min()
           dtype minval;
           sr->min((char*)&minval);
           Monoid<dtype, 1> mmax = Monoid<dtype, 1>(minval, CTF_int::default_max<dtype, 1>, MPI_MAX);
           ret = reduce_sum((char*)&ans, &mmax);
         }
         break;
       case OP_MIN:
         {
           // the min-monoid is seeded with the value written by sr->max()
           dtype maxval;
           sr->max((char*)&maxval);
           Monoid<dtype, 1> mmin = Monoid<dtype, 1>(maxval, CTF_int::default_min<dtype, 1>, MPI_MIN);
           ret = reduce_sum((char*)&ans, &mmin);
         }
         break;
       case OP_MAXABS:
         {
           dtype minval;
           sr->min((char*)&minval);
           Monoid<dtype, 1> mmax = Monoid<dtype, 1>(minval, CTF_int::default_max<dtype, 1>, MPI_MAX);
           ret = reduce_sumabs((char*)&ans, &mmax);
         }
         break;
       case OP_MINABS:
         {
           dtype maxval;
           sr->max((char*)&maxval);
           Monoid<dtype, 1> mmin = Monoid<dtype, 1>(maxval, CTF_int::default_min<dtype, 1>, MPI_MIN);
           ret = reduce_sumabs((char*)&ans, &mmin);
         }
         break;
       default:
         // nothing was reduced: ret and ans were never written, so stop here rather
         // than letting the status check and return below read indeterminate values
         printf("CTF ERROR: unsupported reduction operation passed to reduce\n");
         IASSERT(0);
         return dtype();
     }
     if (ret != CTF_int::SUCCESS){ printf("CTF ERROR: failed to execute function reduce\n"); IASSERT(0); }
     return ans;
   }


   /**
    * \brief Computes the sum of absolute values of all elements of A as a double.
    *
    * Labels the dimensions 'a', 'b', ... and applies a Function mapping each element
    * to (double)std::abs(element) over A indexed by those labels; the result is
    * assigned to nrm.
    *
    * \param[in]  A   tensor to evaluate
    * \param[out] nrm receives the result
    */
   template<typename dtype>
   void real_norm1(Tensor<dtype> & A, double & nrm){
     // one extra slot: the labels are passed as a const char *, so keep them
     // NUL-terminated, and never declare a zero-length array when A.order is 0
     char inds[A.order+1];
     for (int i=0; i<A.order; i++){
       inds[i] = 'a'+i;
     }
     inds[A.order] = '\0';
     nrm = Function<dtype,double>([](dtype a){ return (double)std::abs(a); })(A[inds]);
   }

   /**
    * \brief bool specialization of real_norm1.
    *
    * Labels the dimensions 'a', 'b', ... and assigns A indexed by those labels directly
    * to nrm (relying on the indexed tensor's conversion to double); no absolute value
    * is applied.
    *
    * \param[in]  A   tensor to evaluate
    * \param[out] nrm receives the result
    */
   template<>
   inline void real_norm1<bool>(Tensor<bool> & A, double & nrm){
     // one extra slot: the labels are passed as a const char *, so keep them
     // NUL-terminated, and never declare a zero-length array when A.order is 0
     char inds[A.order+1];
     for (int i=0; i<A.order; i++){
       inds[i] = 'a'+i;
     }
     inds[A.order] = '\0';
     nrm = A[inds];
   }


   /**
    * \brief Generic norm1 fallback for element types without a specialization.
    *
    * Prints an error naming the tensor on rank 0 and then asserts; nrm is never written.
    */
   template<typename dtype>
   void Tensor<dtype>::norm1(double & nrm){
     bool const is_root = (wrld->rank == 0);
     if (is_root){
       printf("CTF ERROR: norm not available for the type of tensor %s\n",name);
     }
     IASSERT(0);
   }

 // NORM1_INST(dtype) emits an explicit specialization of Tensor<dtype>::norm1 that
 // forwards to real_norm1<dtype>(*this, nrm). It is expanded below for bool, the
 // listed signed integer types, float and double; any other element type falls back
 // to the generic norm1 definition.
 #define NORM1_INST(dtype) \
   template<> \
   inline void Tensor<dtype>::norm1(double & nrm){ \
     real_norm1<dtype>(*this, nrm); \
   }

 NORM1_INST(bool)
 NORM1_INST(int8_t)
 NORM1_INST(int16_t)
 NORM1_INST(int)
 NORM1_INST(int64_t)
 NORM1_INST(float)
 NORM1_INST(double)

   /**
    * \brief Computes the square root of the sum of squares of all elements of A.
    *
    * Labels the dimensions 'a', 'b', ... and applies a Function mapping each element
    * to (double)(element*element) over A indexed by those labels; nrm receives the
    * square root of that result.
    *
    * \param[in]  A   tensor to evaluate
    * \param[out] nrm receives the result
    */
   template<typename dtype>
   static void real_norm2(Tensor<dtype> & A, double & nrm){
     // one extra slot: the labels are passed as a const char *, so keep them
     // NUL-terminated, and never declare a zero-length array when A.order is 0
     char inds[A.order+1];
     for (int i=0; i<A.order; i++){
       inds[i] = 'a'+i;
     }
     inds[A.order] = '\0';
     nrm = std::sqrt((double)Function<dtype,double>([](dtype a){ return (double)(a*a); })(A[inds]));
   }

   /**
    * \brief Computes the square root of the sum of std::norm(element) over all elements of A.
    *
    * Labels the dimensions 'a', 'b', ... and applies a Function mapping each element
    * to (double)std::norm(element) over A indexed by those labels; nrm receives the
    * square root of that result.
    *
    * \param[in]  A   tensor to evaluate
    * \param[out] nrm receives the result
    */
   template<typename dtype>
   static void complex_norm2(Tensor<dtype> & A, double & nrm){
     // one extra slot: the labels are passed as a const char *, so keep them
     // NUL-terminated, and never declare a zero-length array when A.order is 0
     char inds[A.order+1];
     for (int i=0; i<A.order; i++){
       inds[i] = 'a'+i;
     }
     inds[A.order] = '\0';
     nrm = std::sqrt((double)Function<dtype,double>([](dtype a){ return (double)std::norm(a); })(A[inds]));
   }


   /**
    * \brief Generic norm2 fallback for element types without a specialization.
    *
    * Prints an error naming the tensor on rank 0 and then asserts; nrm is never written.
    */
   template<typename dtype>
   void Tensor<dtype>::norm2(double & nrm){
     bool const is_root = (wrld->rank == 0);
     if (is_root){
       printf("CTF ERROR: norm not available for the type of tensor %s\n",name);
     }
     IASSERT(0);
   }

 // NORM2_REAL_INST(dtype) defines the explicit specialization
 // Tensor<dtype>::norm2(double&), forwarding to real_norm2<dtype>.
 #define NORM2_REAL_INST(dtype) \
   template<> \
   inline void Tensor<dtype>::norm2(double & nrm){ \
     real_norm2<dtype>(*this, nrm); \
   }

 // NORM2_COMPLEX_INST(dtype) defines the explicit specialization
 // Tensor< std::complex<dtype> >::norm2(double&), forwarding to
 // complex_norm2< std::complex<dtype> >.
 #define NORM2_COMPLEX_INST(dtype) \
   template<> \
   inline void Tensor< std::complex<dtype> >::norm2(double & nrm){ \
     complex_norm2< std::complex<dtype> >(*this, nrm); \
   }


 // Element types for which norm2(double&) is provided.
 NORM2_REAL_INST(bool)
 NORM2_REAL_INST(int8_t)
 NORM2_REAL_INST(int16_t)
 NORM2_REAL_INST(int)
 NORM2_REAL_INST(int64_t)
 NORM2_REAL_INST(float)
 NORM2_REAL_INST(double)
 NORM2_COMPLEX_INST(float)
 NORM2_COMPLEX_INST(double)

   // Generic fallback of norm_infty(double&) for element types without an
   // explicit specialization: rank 0 prints the error, then every rank
   // hits IASSERT(0). nrm is not written.
   template<typename dtype>
   void Tensor<dtype>::norm_infty(double & nrm){
     if (0 == wrld->rank){
       printf("CTF ERROR: norm not available for the type of tensor %s\n",name);
     }
     IASSERT(0);
   }

 // NORM_INFTY_INST(dtype) defines the explicit specialization
 // Tensor<dtype>::norm_infty(double&), which calls the argument-free
 // norm_infty() overload and stores its result in nrm.
 #define NORM_INFTY_INST(dtype) \
   template<> \
   inline void Tensor<dtype>::norm_infty(double & nrm){ \
     nrm = this->norm_infty(); \
   }

 // Element types for which norm_infty(double&) is provided.
 NORM_INFTY_INST(bool)
 NORM_INFTY_INST(int8_t)
 NORM_INFTY_INST(int16_t)
 NORM_INFTY_INST(int)
 NORM_INFTY_INST(int64_t)
 NORM_INFTY_INST(float)
 NORM_INFTY_INST(double)

 // The instantiation helper macros are only needed above; remove them so
 // they do not leak into code that follows.
 #undef NORM1_INST
 #undef NORM2_REAL_INST
 #undef NORM2_COMPLEX_INST
 #undef NORM_INFTY_INST

   // Typed wrapper around CTF_int::tensor::get_max_abs.
   //   n    : number of elements requested
   //   data : output buffer, handed to the untyped implementation
   // On a non-SUCCESS return code an error is printed and IASSERT(0) fires.
   template<typename dtype>
   void Tensor<dtype>::get_max_abs(int     n,
                                   dtype * data) const {
     // The untyped base routine takes a raw char* buffer; dtype* does not
     // convert to char* implicitly, so the cast must be explicit.
     int ret = CTF_int::tensor::get_max_abs(n, (char*)data);
     if (ret != CTF_int::SUCCESS){ printf("CTF ERROR: failed to execute function get_max_abs\n"); IASSERT(0); return; }
   }

   // Generic fallback of fill_random for element types without an explicit
   // specialization: rank 0 prints the error, then every rank hits
   // IASSERT(0). The range arguments are ignored.
   template<typename dtype>
   void Tensor<dtype>::fill_random(dtype rmin, dtype rmax){
     const bool is_root = (wrld->rank == 0);
     if (is_root){
       printf("CTF ERROR: fill_random(rmin, rmax) not available for the type of tensor %s\n",name);
     }
     IASSERT(0);
   }

   // Overwrites each of the T.size locally stored values of a dense tensor
   // with get_rand48()*(rmax-rmin)+rmin, then zeroes the padding.
   // Sparse tensors are rejected with an error message and IASSERT(0).
   //   rmin, rmax : bounds used to scale the random draw
   //   T          : tensor whose local data is overwritten
   template <typename dtype>
   void fill_random_base(dtype rmin, dtype rmax, Tensor<dtype> & T){
     if (!T.is_sparse){
       dtype * vals = (dtype*)T.data;
       for (int64_t pos=0; pos<T.size; pos++){
         vals[pos] = CTF_int::get_rand48()*(rmax-rmin)+rmin;
       }
       T.zero_out_padding();
       return;
     }
     // sparse tensors are not supported by this routine
     printf("CTF ERROR: fill_random should not be called on a sparse tensor, use fill_random_sp instead\n");
     IASSERT(0);
   }

   // fill_random for double tensors: delegates to fill_random_base.
   template<>
   inline void Tensor<double>::fill_random(double rmin, double rmax){
     Tensor<double> & self = *this;
     fill_random_base<double>(rmin, rmax, self);
   }

   // fill_random for float tensors: delegates to fill_random_base.
   template<>
   inline void Tensor<float>::fill_random(float rmin, float rmax){
     Tensor<float> & self = *this;
     fill_random_base<float>(rmin, rmax, self);
   }

   // fill_random for int64_t tensors: delegates to fill_random_base.
   template<>
   inline void Tensor<int64_t>::fill_random(int64_t rmin, int64_t rmax){
     Tensor<int64_t> & self = *this;
     fill_random_base<int64_t>(rmin, rmax, self);
   }

   // fill_random for int tensors: delegates to fill_random_base.
   template<>
   inline void Tensor<int>::fill_random(int rmin, int rmax){
     Tensor<int> & self = *this;
     fill_random_base<int>(rmin, rmax, self);
   }


   // Generic fallback of fill_sp_random for element types without an
   // explicit specialization: rank 0 prints the error, then every rank hits
   // IASSERT(0). All arguments are ignored.
   template<typename dtype>
   void Tensor<dtype>::fill_sp_random(dtype rmin, dtype rmax, double frac_sp){
     const int my_rank = wrld->rank;
     if (my_rank == 0){
       printf("CTF ERROR: fill_sp_random(rmin, rmax, frac_sp) not available for the type of tensor %s\n",name);
     }
     IASSERT(0);
   }

   // Populates T with randomly placed entries and then assigns each stored
   // entry the value get_rand48()*(rmax-rmin)+rmin.
   //   rmin, rmax : bounds used to scale the random values
   //   frac_sp    : targeted fraction of the dense index space to populate
   //   T          : tensor that is written
   // Each process draws its share of random global keys, writes them with a
   // placeholder value, and a Transform then overwrites the values.
   template <typename dtype>
   void fill_sp_random_base(dtype rmin, dtype rmax, double frac_sp, Tensor<dtype> * T){
     // size of the dense index space: product of all edge lengths
     int64_t tot_size = 1; //CTF_int::packed_size(T.order, T.lens, T.sym);
     for (int i=0; i<T->order; i++) tot_size *= T->lens[i];
     double sf = tot_size*frac_sp;
     double dg = 0.0;
     // Oversample to account for conflicts between randomly drawn keys: dg
     // accumulates tot_size*(frac_sp + frac_sp^2/2! + frac_sp^3/3! + ...),
     // i.e. approximately tot_size*(e^frac_sp - 1) rather than
     // tot_size*frac_sp.
     for (int i=2; i<20; i++){
       dg += sf;
       sf *= frac_sp/i;
     }
     int64_t gen_size = (int64_t)(dg+.5);
     // split gen_size across processes; the first (gen_size % np) ranks take
     // one extra key
     int64_t my_gen_size = gen_size/T->wrld->np;
     if (gen_size % T->wrld->np > T->wrld->rank){
       my_gen_size++;
     }
     Pair<dtype> * pairs = (Pair<dtype>*)T->sr->pair_alloc(my_gen_size);
     for (int64_t i=0; i<my_gen_size; i++){
       // random key in [0,tot_size) with placeholder value 1
       pairs[i] = Pair<dtype>((int64_t)(CTF_int::get_rand48()*tot_size), 1.0);
     }
     T->write(my_gen_size,pairs);
     T->sr->pair_dealloc((char*)pairs);
     // One index label per tensor mode: 'a', 'b', 'c', ...
     // std::vector instead of a variable-length array (not ISO C++); the
     // extra '\0' slot keeps the buffer non-empty for order-0 tensors.
     std::vector<char> str(T->order+1, '\0');
     for (int i=0; i<T->order; i++){
       str[i] = 'a'+i;
     }

     // replace the placeholder of every stored entry by a random value
     Transform<dtype>([=](dtype & d){ d=CTF_int::get_rand48()*(rmax-rmin)+rmin; })(T->operator[](str.data()));
   }

   // fill_sp_random for double tensors: delegates to fill_sp_random_base.
   template<>
   inline void Tensor<double>::fill_sp_random(double rmin, double rmax, double frac_sp){
     Tensor<double> * self = this;
     fill_sp_random_base<double>(rmin, rmax, frac_sp, self);
   }

   // fill_sp_random for float tensors: delegates to fill_sp_random_base.
   template<>
   inline void Tensor<float>::fill_sp_random(float rmin, float rmax, double frac_sp){
     Tensor<float> * self = this;
     fill_sp_random_base<float>(rmin, rmax, frac_sp, self);
   }

   // fill_sp_random for int tensors: delegates to fill_sp_random_base.
   template<>
   inline void Tensor<int>::fill_sp_random(int rmin, int rmax, double frac_sp){
     Tensor<int> * self = this;
     fill_sp_random_base<int>(rmin, rmax, frac_sp, self);
   }

   // fill_sp_random for int64_t tensors: delegates to fill_sp_random_base.
   template<>
   inline void Tensor<int64_t>::fill_sp_random(int64_t rmin, int64_t rmax, double frac_sp){
     Tensor<int64_t> * self = this;
     fill_sp_random_base<int64_t>(rmin, rmax, frac_sp, self);
   }

   // Builds and executes a CTF_int::contraction of A[idx_A] and B[idx_B] into
   // this tensor indexed by idx_C, with scaling factors alpha and beta.
   // A and B must use the same communicator as this tensor; otherwise an
   // error is printed, IASSERT(0) fires and nothing is executed.
   template<typename dtype>
   void Tensor<dtype>::contract(dtype            alpha,
                                CTF_int::tensor& A,
                                const char *     idx_A,
                                CTF_int::tensor& B,
                                const char *     idx_B,
                                dtype            beta,
                                const char *     idx_C){
     const bool worlds_match = (A.wrld->cdt.cm == wrld->cdt.cm) &&
                               (B.wrld->cdt.cm == wrld->cdt.cm);
     if (!worlds_match){
       printf("CTF ERROR: worlds of contracted tensors must match\n");
       IASSERT(0);
       return;
     }
     // the scalars are passed to the untyped layer as raw byte pointers
     CTF_int::contraction ctr(&A, idx_A, &B, idx_B, (char*)&alpha, this, idx_C, (char*)&beta);
     ctr.execute();
   }

   // Same as contract(alpha, A, idx_A, B, idx_B, beta, idx_C), but the
   // contraction is additionally given the bivariate function fseq.
   // A and B must use the same communicator as this tensor; otherwise an
   // error is printed, IASSERT(0) fires and nothing is executed.
   template<typename dtype>
   void Tensor<dtype>::contract(dtype                 alpha,
                                CTF_int::tensor&      A,
                                const char *          idx_A,
                                CTF_int::tensor&      B,
                                const char *          idx_B,
                                dtype                 beta,
                                const char *          idx_C,
                                Bivar_Function<dtype> fseq){
     const bool worlds_match = (A.wrld->cdt.cm == wrld->cdt.cm) &&
                               (B.wrld->cdt.cm == wrld->cdt.cm);
     if (!worlds_match){
       printf("CTF ERROR: worlds of contracted tensors must match\n");
       IASSERT(0);
       return;
     }
     // the scalars are passed to the untyped layer as raw byte pointers
     CTF_int::contraction ctr(&A, idx_A, &B, idx_B, (char const *)&alpha, this, idx_C, (char const *)&beta, &fseq);
     ctr.execute();
   }


   // Builds and executes a CTF_int::summation of A[idx_A] into this tensor
   // indexed by idx_B, with scaling factors alpha and beta.
   // A must use the same communicator as this tensor; otherwise an error is
   // printed, IASSERT(0) fires and nothing is executed.
   template<typename dtype>
   void Tensor<dtype>::sum(dtype            alpha,
                           CTF_int::tensor& A,
                           const char *     idx_A,
                           dtype            beta,
                           const char *     idx_B){
     const bool worlds_match = (A.wrld->cdt.cm == wrld->cdt.cm);
     if (!worlds_match){
       printf("CTF ERROR: worlds of summed tensors must match\n");
       IASSERT(0);
       return;
     }

     // the scalars are passed to the untyped layer as raw byte pointers
     CTF_int::summation smm(&A, idx_A, (char*)&alpha, this, idx_B, (char*)&beta);
     smm.execute();
   }

   // Same as sum(alpha, A, idx_A, beta, idx_B), but the summation is
   // additionally given the univariate function fseq.
   // A must use the same communicator as this tensor; otherwise an error is
   // printed, IASSERT(0) fires and nothing is executed.
   template<typename dtype>
   void Tensor<dtype>::sum(dtype                  alpha,
                           CTF_int::tensor&       A,
                           const char *           idx_A,
                           dtype                  beta,
                           const char *           idx_B,
                           Univar_Function<dtype> fseq){
     const bool worlds_match = (A.wrld->cdt.cm == wrld->cdt.cm);
     if (!worlds_match){
       printf("CTF ERROR: worlds of summed tensors must match\n");
       IASSERT(0);
       return;
     }

     // the scalars are passed to the untyped layer as raw byte pointers
     CTF_int::summation smm(&A, idx_A, (char const *)&alpha, this, idx_B, (char const *)&beta, &fseq);
     smm.execute();
   }

   // Builds and executes a CTF_int::scaling of this tensor indexed by idx_A
   // with the factor alpha.
   template<typename dtype>
   void Tensor<dtype>::scale(dtype        alpha,
                             const char * idx_A){
     // alpha is passed to the untyped layer as a raw byte pointer
     CTF_int::scaling scaler(this, idx_A, (char*)&alpha);
     scaler.execute();
   }


   // Builds and executes a CTF_int::scaling of this tensor indexed by idx_A,
   // given the endomorphism fseq and the factor alpha.
   template<typename dtype>
   void Tensor<dtype>::scale(dtype               alpha,
                             const char *        idx_A,
                             Endomorphism<dtype> fseq){
     // alpha is passed to the untyped layer as a raw byte pointer
     CTF_int::scaling scaler(this, idx_A, &fseq, (char const *)&alpha);
     scaler.execute();
   }

   // Typed wrapper around CTF_int::tensor::read(idx, prl, blk, unpack): the
   // pointer returned by the untyped layer is reinterpreted as dtype*.
   template<typename dtype>
   dtype * Tensor<dtype>::get_mapped_data(char const *          idx,
                                          Idx_Partition const & prl,
                                          Idx_Partition const & blk,
                                          bool                  unpack){
     auto raw = CTF_int::tensor::read(idx, prl, blk, unpack);
     return (dtype*)raw;
   }


   // Assigns a scalar: forwards the bytes of val to set() and returns
   // *this so that assignments can be chained.
   template<typename dtype>
   Tensor<dtype>& Tensor<dtype>::operator=(dtype val){
     char const * val_bytes = (char const*)&val;
     set(val_bytes);
     return *this;
   }

   // Returns the time estimate reported by a CTF_int::contraction of
   // A[idx_A] and B[idx_B] into this tensor indexed by idx_C, built with
   // this tensor's multiplicative identity as alpha and additive identity
   // as beta. The contraction is only constructed, not executed.
   template<typename dtype>
   double Tensor<dtype>::estimate_time(
                                     CTF_int::tensor& A,
                                     const char *     idx_A,
                                     CTF_int::tensor& B,
                                     const char *     idx_B,
                                     const char *     idx_C){
     char const * alpha = sr->mulid();
     char const * beta  = sr->addid();
     CTF_int::contraction ctr(&A, idx_A, &B, idx_B, alpha, this, idx_C, beta);
     return ctr.estimate_time();
   }

   // Returns the time estimate reported by a CTF_int::summation of A[idx_A]
   // into this tensor indexed by idx_B, built with this tensor's
   // multiplicative identity as alpha and additive identity as beta.
   // The summation is only constructed, not executed.
   template<typename dtype>
   double Tensor<dtype>::estimate_time(
                                     CTF_int::tensor& A,
                                     const char *     idx_A,
                                     const char *     idx_B){
     char const * alpha = sr->mulid();
     char const * beta  = sr->addid();
     CTF_int::summation smm(&A, idx_A, alpha, this, idx_B, beta);
     return smm.estimate_time();
   }

   // Assigns another tensor: releases this tensor, re-initializes it with
   // A's algebraic structure, order, lengths, symmetry, world, name, profile
   // flag and sparsity (without allocating data), then copies A's data.
   // A is received by value, so the source object used here is distinct
   // from *this even when a tensor is assigned to itself.
   template<typename dtype>
   Tensor<dtype>& Tensor<dtype>::operator=(Tensor<dtype> A){
     this->free_self();

     bool const alloc_data = false;
     this->init(A.sr, A.order, A.lens, A.sym, A.wrld, alloc_data, A.name, A.profile, A.is_sparse);

     Tensor<dtype> const * src = &A;
     this->copy_tensor_data(src);
     return *this;
   }


   // Returns a Sparse_Tensor constructed from the given indices and a
   // pointer to this tensor.
   template<typename dtype>
   Sparse_Tensor<dtype> Tensor<dtype>::operator[](std::vector<int64_t> indices){
     return Sparse_Tensor<dtype>(indices, this);
   }

 }


CTF_int::SUCCESS
Definition: common.h:97

CTF_int::tensor::read
void read(int64_t num_pair, char const *alpha, char const *beta, int64_t const *inds, char *data)
read tensor data with <key, value> pairs where key is the global index for the value, which gets filled in with beta times the old values plus alpha times the values read from the tensor.
Definition: untyped_tensor.cxx:1203

CTF_int::tensor::reduce_sumabs
int reduce_sumabs(char *result)
Performs an elementwise absolute value summation reduction on a tensor.
Definition: untyped_tensor.cxx:1789

CTF::OP_SUM
Definition: common.h:51

CTF::Tensor::prnt
void prnt() const
Definition: tensor.cxx:417

CTF::Transform
Definition: functions.h:488

CTF::Tensor::profile_off
void profile_off()
turns off profiling for tensor
Definition: tensor.cxx:402

CTF::Tensor::contract
void contract(dtype alpha, CTF_int::tensor &A, char const *idx_A, CTF_int::tensor &B, char const *idx_B, dtype beta, char const *idx_C)
contracts C[idx_C] = beta*C[idx_C] + alpha*A[idx_A]*B[idx_B]

CTF::OP
OP
reduction types for tensor data deprecated types: OP_NORM1=OP_SUMABS, OP_NORM2=call norm2()...
Definition: common.h:51

CTF::Endomorphism
custom scalar function on tensor: e.g. A["ij"] = f(A["ij"])
Definition: functions.h:23

CTF::World::cdt
CTF_int::CommData cdt
communicator data for MPI comm defining this world
Definition: world.h:32

CTF::Function
Definition: functions.h:441

CTF_int::tensor::sym
int * sym
symmetries among tensor dimensions
Definition: untyped_tensor.h:74

CTF_int::contraction::execute
void execute()
run contraction
Definition: contraction.cxx:99

CTF_int::algstrct::clone
virtual algstrct * clone() const  =0
''copy constructor''

CTF_int::tensor::slice
void slice(int const *offsets_B, int const *ends_B, char const *beta, tensor *A, int const *offsets_A, int const *ends_A, char const *alpha)
accumulates out a slice (block) of this tensor = B B[offsets,ends)=beta*B[offsets,ends) + alpha*A[offsets_A,ends_A)
Definition: untyped_tensor.cxx:861

CTF_int::tensor::reduce_sum
int reduce_sum(char *result)
Performs an elementwise summation reduction on a tensor.
Definition: untyped_tensor.cxx:1771

CTF::Tensor::profile_on
void profile_on()
turns on profiling for tensor
Definition: tensor.cxx:397

CTF::Pair::d
dtype d
tensor value associated with index
Definition: tensor.h:34

NORM1_INST
#define NORM1_INST(dtype)
Definition: tensor.cxx:829

CTF::Ring
Ring class defined by a datatype and addition and multiplication functions; addition must have an ident...
Definition: ring.h:18

CTF_int::algstrct::pair_alloc
virtual char * pair_alloc(int64_t n) const
allocate space for n (int64_t,dtype) pairs, necessary for object types
Definition: algstrct.cxx:681

CTF::Tensor::add_to_subworld
void add_to_subworld(Tensor< dtype > *tsr, dtype alpha, dtype beta)
accumulates this tensor to a tensor object defined on a different world
Definition: tensor.cxx:540

CTF::Tensor::i
Typ_Idx_Tensor< dtype > i(char const *idx_map)
Definition: tensor.cxx:141

CTF_int::summation::execute
void execute(bool run_diag=false)
run summation
Definition: summation.cxx:119

CTF::Tensor::get_local_pairs
void get_local_pairs(int64_t *npair, Pair< dtype > **pairs, bool nonzeros_only=false, bool unpack_sym=false) const
gives the global indices and values associated with the local data
Definition: tensor.cxx:201

CTF::Tensor::slice
Tensor< dtype > slice(int const *offsets, int const *ends) const
cuts out a slice (block) of this tensor A[offsets,ends) result will always be fully nonsymmetric ...
Definition: tensor.cxx:643

CTF::real_norm1< bool >
void real_norm1< bool >(Tensor< bool > &A, double &nrm)
Definition: tensor.cxx:812

CTF_int::tensor::profile_off
void profile_off()
turn off profiling
Definition: untyped_tensor.cxx:711

CTF_int::algstrct::is_ordered
virtual bool is_ordered() const  =0

NORM2_COMPLEX_INST
#define NORM2_COMPLEX_INST(dtype)
Definition: tensor.cxx:876

CTF::Tensor::permute
void permute(dtype beta, CTF_int::tensor &A, int *const *perms_A, dtype alpha)
Apply permutation to matrix, potentially extracting a slice B[i,j,...] = beta*B[...] + alpha*A[perms_A[0][i],perms_A[1][j],...].
Definition: tensor.cxx:429

CTF_int::get_rand48
double get_rand48()
returns new random number in [0,1)
Definition: common.cxx:27

CTF_int::tensor::sparsify
int sparsify(char const *threshold=NULL, bool take_abs=true)
reduce tensor to sparse format, storing only nonzero data, or data above a specified threshold...
Definition: untyped_tensor.cxx:1332

CTF_int::tensor::size
int64_t size
current size of local tensor data chunk (mapping-dependent)
Definition: untyped_tensor.h:98

CTF::Semiring
Semiring is a Monoid with an additional multiplication function; addition must have an identity and be as...
Definition: semiring.h:359

CTF_int::alloc
void * alloc(int64_t len)
alloc abstraction
Definition: memcontrol.cxx:365

CTF::Tensor::reduce
dtype reduce(OP op)
performs a reduction on the tensor
Definition: tensor.cxx:731

CTF::Tensor::read_all
void read_all(int64_t *npair, dtype **data, bool unpack=false)
collects the entire tensor data on each process (not memory scalable)
Definition: tensor.cxx:377

CTF::Bivar_Function
custom bivariate function on two tensors: e.g. C["ij"] = f(A["ik"],B["kj"])
Definition: functions.h:137

NS
Definition: common.h:37

CTF::OP_MINABS
Definition: common.h:51

CTF::OP_MAX
Definition: common.h:51

CTF_int::algstrct::addid
virtual char const * addid() const
identity element for addition i.e. 0
Definition: algstrct.cxx:89

CTF::World
an instance of the CTF library (world) on a MPI communicator
Definition: world.h:19

CTF::Tensor::set_name
void set_name(char const *name)
sets tensor name
Definition: tensor.cxx:392

CTF_int::tensor::is_sparse
bool is_sparse
whether only the non-zero elements of the tensor are stored
Definition: untyped_tensor.h:131

CTF_int::tensor::order
int order
number of tensor dimensions
Definition: untyped_tensor.h:76

CTF::Pair::k
int64_t k
key, global index [i1,i2,...] specified as i1+len[0]*i2+...
Definition: tensor.h:31

IASSERT
#define IASSERT(...)
Definition: common.h:74

CTF_int::PairIterator::read_val
void read_val(char *buf) const
sets external value to the value pointed by the iterator
Definition: algstrct.cxx:801

CTF::Tensor::read_local
void read_local(int64_t *npair, int64_t **global_idx, dtype **data, bool unpack_sym=false) const
Using get_local_data(), which returns an array that must be freed with delete [], is more efficient...
Definition: tensor.cxx:182

CTF::Tensor::compare
void compare(const Tensor< dtype > &A, FILE *fp=stdout, double cutoff=-1.0)
prints two sets of tensor data side-by-side to file using process 0
Definition: tensor.cxx:424

CTF::Idx_Partition
Definition: partition.h:28

world.h

CTF_int::tensor::permute
int permute(tensor *A, int *const *permutation_A, char const *alpha, int *const *permutation_B, char const *beta)
Definition: untyped_tensor.cxx:720

CTF_int::PairIterator
Definition: algstrct.h:434

CTF_int::algstrct::alloc
virtual char * alloc(int64_t n) const
allocate space for n items, necessary for object types
Definition: algstrct.cxx:685

NORM_INFTY_INST
#define NORM_INFTY_INST(dtype)
Definition: tensor.cxx:900

CTF_int::summation::estimate_time
double estimate_time()
predicts execution time in seconds using performance models
Definition: summation.cxx:132

CTF::Tensor::norm2
dtype norm2()
computes the frobenius norm of the tensor (needs sqrt()!)
Definition: tensor.h:811

CTF_int::tensor::align
int align(tensor const *B)
align mapping of this tensor to that of B
Definition: untyped_tensor.cxx:1749

CTF::Pair
index-value pair used for tensor data input
Definition: tensor.h:28

CTF::Tensor::read_sparse_from_file
void read_sparse_from_file(const char *fpath, bool with_vals=true)
read sparse tensor from file, entries of tensor must be stored one per line, as i_1 ...

CTF_int::tensor::wrld
CTF::World * wrld
distributed processor context on which tensor is defined
Definition: untyped_tensor.h:70

CTF::Univar_Function
custom function f : X -> Y to be applied to tensor elements: e.g. B["ij"] = f(A["ij"]) ...
Definition: functions.h:55

CTF::OP_MAXABS
Definition: common.h:51

ctf.core.scl
def scl(self, s)
Definition: core.pyx:473

CTF_int::scaling
class for execution distributed scaling of a tensor
Definition: scaling.h:14

CTF::Sparse_Tensor
a sparse subset of a tensor
Definition: sparse_tensor.h:14

ctf.core.a
a
Definition: core.pyx:385

CTF::OP_SUMSQ
Definition: common.h:51

CTF::OP_MIN
Definition: common.h:51

CTF::Tensor::fill_random
void fill_random(dtype rmin, dtype rmax)
fills local unique tensor elements to random values in the range [min,max] works only for dtype in {f...
Definition: tensor.cxx:928

CTF::World::rank
int rank
rank of local processor
Definition: world.h:24

CTF_int::algstrct::min
virtual void min(char const *a, char const *b, char *c) const
c = min(a,b)
Definition: algstrct.cxx:132

CTF_int::tensor::write
int write(int64_t num_pair, char const *alpha, char const *beta, char *mapped_data, char const rw='w')
Add tensor data new=alpha*new+beta*old with <key, value> pairs where key is the global index for the ...
Definition: untyped_tensor.cxx:1082

CTF_int::contraction
class for execution distributed contraction of tensors
Definition: contraction.h:16

CTF_int::tensor::print
void print(FILE *fp=stdout, char const *cutoff=NULL) const
prints tensor data to file using process 0
Definition: untyped_tensor.cxx:1825

CTF_int::tensor::zero_out_padding
int zero_out_padding()
sets padded portion of tensor to zero (this should be maintained internally)
Definition: untyped_tensor.cxx:2570

idx_tensor.h

CTF_int::tensor::lens
int * lens
unpadded tensor edge lengths
Definition: untyped_tensor.h:78

CTF_int::tensor::add_from_subworld
void add_from_subworld(tensor *tsr_sub, char const *alpha, char const *beta)
accumulates this tensor from a tensor object defined on a different world
Definition: untyped_tensor.cxx:1037

ctf.core.dtype
dtype
Definition: core.pyx:387

CTF::Tensor::norm_infty
dtype norm_infty()
finds the max absolute value element of the tensor
Definition: tensor.h:816

CTF_int::tensor::allread
int allread(int64_t *num_pair, char **all_data, bool unpack)
read entire tensor with each processor (in packed layout). WARNING: will use an 'unscalable' amount o...
Definition: untyped_tensor.cxx:1724

CTF::Tensor::sparsify
void sparsify()
reduce tensor to sparse format, storing only nonzero data, or data above a specified threshold...
Definition: tensor.cxx:449

CTF::Tensor::~Tensor
~Tensor()
frees CTF tensor
Definition: tensor.cxx:149

CTF::Tensor::align
void align(CTF_int::tensor const &A)
aligns data mapping with tensor A
Definition: tensor.cxx:720

CTF_int::tensor::tensor
tensor()
Definition: untyped_tensor.cxx:36

CTF::Tensor::operator[]
Typ_Idx_Tensor< dtype > operator[](char const *idx_map)
associated an index map with the tensor for future operation

CTF_int::PairIterator::k
int64_t k() const
returns key of pair at head of ptr
Definition: algstrct.cxx:789

CTF_int::tensor::compare
void compare(const tensor *A, FILE *fp, char const *cutoff)
prints two sets of tensor data side-by-side to file using process 0
Definition: untyped_tensor.cxx:1930

CTF::Tensor::print
void print(FILE *fp, dtype cutoff) const
prints tensor data to file using process 0 (modify print(...) overload in set.h if you would like a d...
Definition: tensor.cxx:407

CTF_int::tensor::sr
algstrct * sr
algstrct on which tensor elements and operations are defined
Definition: untyped_tensor.h:72

CTF_int::algstrct::pair_dealloc
virtual void pair_dealloc(char *ptr) const
deallocate given pointer containing contiguous array of pairs
Definition: algstrct.cxx:693

CTF::read_sparse_from_file_base
void read_sparse_from_file_base(const char *fpath, bool with_vals, Tensor< dtype > *T)
Definition: tensor.cxx:467

CTF::Tensor::fill_sp_random
void fill_sp_random(dtype rmin, dtype rmax, double frac_sp)
generate roughly frac_sp*dense_tensor_size nonzeros between rmin and rmax, works only for dtype in {f...
Definition: tensor.cxx:969

CTF_int::contraction::estimate_time
double estimate_time()
predicts execution time in seconds using performance models
Definition: contraction.cxx:163

ctf.core.abs
def abs(initA)
Definition: core.pyx:5440

CTF::Tensor::add_from_subworld
void add_from_subworld(Tensor< dtype > *tsr, dtype alpha, dtype beta)
accumulates this tensor from a tensor object defined on a different world
Definition: tensor.cxx:560

CTF::fill_sp_random_base
void fill_sp_random_base(dtype rmin, dtype rmax, double frac_sp, Tensor< dtype > *T)
Definition: tensor.cxx:976

CTF::Typ_Idx_Tensor
Definition: idx_tensor.h:164

CTF_int::CommData::cm
MPI_Comm cm
Definition: common.h:129

CTF::Tensor::write_sparse_to_file
void write_sparse_to_file(const char *fpath, bool with_vals=true)
write sparse tensor to file, entries of tensor will be stored one per line, as i_1 ...

ctf.core.copy
def copy(tensor, A)
Definition: core.pyx:3583

CTF::real_norm1
void real_norm1(Tensor< dtype > &A, double &nrm)
Definition: tensor.cxx:803

CTF::Tensor::get_local_data
void get_local_data(int64_t *npair, int64_t **global_idx, dtype **data, bool nonzeros_only=false, bool unpack_sym=false) const
Gives the global indices and values associated with the local data.
Definition: tensor.cxx:159

CTF::Tensor::Tensor
Tensor()
default constructor
Definition: tensor.cxx:12

ctf.core.tsr
tsr
Definition: core.pyx:443

CTF_int::algstrct::max
virtual void max(char const *a, char const *b, char *c) const
c = max(a,b)
Definition: algstrct.cxx:138

CTF::fill_random_base
void fill_random_base(dtype rmin, dtype rmax, Tensor< dtype > &T)
Definition: tensor.cxx:935

CTF_int::tensor::add_to_subworld
void add_to_subworld(tensor *tsr_sub, char const *alpha, char const *beta)
accumulates this tensor to a tensor object defined on a different world
Definition: untyped_tensor.cxx:991

CTF_int::accumulatable::el_size
int el_size
size of each element of algstrct in bytes
Definition: algstrct.h:16

CTF::OP_SUMABS
Definition: common.h:51

CTF_int::tensor::profile
bool profile
whether profiling should be done for contractions/sums involving this tensor
Definition: untyped_tensor.h:129

CTF_int::cdealloc
int cdealloc(void *ptr)
free abstraction
Definition: memcontrol.cxx:480

CTF::Tensor::get_raw_data
dtype * get_raw_data(int64_t *size) const
gives the raw current local data with padding included
Definition: tensor.cxx:152

CTF_int::algstrct
algstrct (algebraic structure) defines the elementwise operations computed in each tensor contraction...
Definition: algstrct.h:34

CTF
Definition: apsp.cxx:17

CTF::Tensor::sum
void sum(dtype alpha, CTF_int::tensor &A, char const *idx_A, dtype beta, char const *idx_B)
sums B[idx_B] = beta*B[idx_B] + alpha*A[idx_A]

CTF_int::tensor::data
char * data
tensor data, either the data or the key-value pairs should exist at any given time ...
Definition: untyped_tensor.h:117

CTF::Monoid
A Monoid is a Set equipped with a binary addition operator '+' or a custom function; addition must hav...
Definition: monoid.h:69

CTF_int::tensor
internal distributed tensor class
Definition: untyped_tensor.h:20

CTF::Tensor::norm1
dtype norm1()
computes the entrywise 1-norm of the tensor
Definition: tensor.h:806

CTF_int::tensor::profile_on
void profile_on()
turn on profiling
Definition: untyped_tensor.cxx:707

CTF::Tensor::get_mapped_data
dtype * get_mapped_data(char const *idx, Idx_Partition const &prl, Idx_Partition const &blk=Idx_Partition(), bool unpack=true)
returns local data of tensor with parallel distribution prl and local blocking blk ...
Definition: tensor.cxx:1129

CTF::Tensor
an instance of a tensor within a CTF world
Definition: tensor.h:74

CTF_int::scaling::execute
int execute()
run scaling
Definition: scaling.cxx:64

CTF::Tensor::read
void read(int64_t npair, Pair< dtype > *pairs)
Gives the values associated with any set of indices.
Definition: tensor.cxx:246

CTF::Tensor::scale
void scale(dtype alpha, char const *idx_A)
scales A[idx_A] = alpha*A[idx_A]

CTF::Tensor::operator=
Tensor< dtype > & operator=(dtype val)
sets all values in the tensor to val
Definition: tensor.cxx:1139

NORM2_REAL_INST
#define NORM2_REAL_INST(dtype)
Definition: tensor.cxx:870

CTF_int::summation
class for execution distributed summation of tensors
Definition: summation.h:15

CTF_int::tensor::read_local_nnz
int read_local_nnz(int64_t *num_pair, char **mapped_data, bool unpack_sym=false) const
read tensor data pairs local to processor that have nonzero values
Definition: untyped_tensor.cxx:1538

CTF::Tensor::estimate_time
double estimate_time(CTF_int::tensor &A, char const *idx_A, CTF_int::tensor &B, char const *idx_B, char const *idx_C)
estimate the time of a contraction C[idx_C] = A[idx_A]*B[idx_B]

CTF_int::tensor::free_self
void free_self()
destructor
Definition: untyped_tensor.cxx:40

CTF_int
Definition: model_trainer.cxx:16

CTF_int::algstrct::mulid
virtual char const * mulid() const
identity element for multiplication i.e. 1
Definition: algstrct.cxx:93

CTF_int::tensor::reduce_sumsq
int reduce_sumsq(char *result)
computes the sum of squares of the elements
Definition: untyped_tensor.cxx:1808

CTF::write_sparse_to_file_base
void write_sparse_to_file_base(const char *fpath, bool with_vals, Tensor< dtype > *T)
Definition: tensor.cxx:506

CTF_int::tensor::copy_tensor_data
void copy_tensor_data(tensor const *other)
copies all tensor data from other
Definition: untyped_tensor.cxx:210

CTF_int::tensor::set_name
void set_name(char const *name)
set the tensor name
Definition: untyped_tensor.cxx:697

CTF::Tensor::write
void write(int64_t npair, int64_t const *global_idx, dtype const *data)
writes in values associated with any set of indices The sparse data is defined in coordinate format...
Definition: tensor.cxx:264

CTF_int::tensor::name
char * name
name given to tensor
Definition: untyped_tensor.h:84

CTF::World::np
int np
number of processors
Definition: world.h:26

CTF_int::tensor::init
void init(algstrct const *sr, int order, int const *edge_len, int const *sym, CTF::World *wrld, bool alloc_data, char const *name, bool profile, bool is_sparse)
initializes tensor data
Definition: untyped_tensor.cxx:306

CTF::World::comm
MPI_Comm comm
set of processors making up this world
Definition: world.h:22

CTF::Tensor::get_max_abs
void get_max_abs(int n, dtype *data) const
obtains a small number of the biggest elements of the tensor in sorted order (e.g. eigenvalues)
Definition: tensor.cxx:920

CTF_int::tensor::read_local
int read_local(int64_t *num_pair, char **mapped_data, bool unpack_sym=false) const
read tensor data pairs local to processor including those with zero values WARNING: for sparse tensor...
Definition: untyped_tensor.cxx:1553

CTF_int::tensor::get_max_abs
int get_max_abs(int n, char *data) const
obtains the largest n elements (in absolute value) of the tensor

CTF_int::cvrt_idx
void cvrt_idx(int order, int const *lens, int64_t idx, int *idx_arr)
Definition: common.cxx:533