#ifndef __UNTYPED_TENSOR_H__
#define __UNTYPED_TENSOR_H__

#include "../mapping/mapping.h"
#include "../mapping/distribution.h"
#include "../interface/world.h"
#include "../interface/partition.h"

PairIterator read_all_pairs(int64_t * num_pair, bool unpack);
void copy_tensor_data(tensor const * other);
void set_distribution(char const * idx, /* ... */);
/* fragment of a longer declaration: ... int const * edge_len, ... bool alloc_data=true, char const * name=NULL, ... */
/* fragment of a longer declaration: ... int const * edge_len, ... char const * name=NULL, ... */
int * calc_phase() const;
int calc_tot_phase() const;
int64_t calc_nvirt() const;
int64_t calc_npe() const;
int set(char const * val);
int zero_out_padding();
void scale_diagonals(int const * sym_mask);
void print_map(FILE * stream=stdout, bool allcall=1) const;
void set_name(char const * name);
char const * get_name() const;
void get_raw_data(char ** data, int64_t * size) const;
int write(int64_t num_pair, /* ... */);
void write(int64_t num_pair, /* ... */ int64_t const * inds, /* ... */);
void read(int64_t num_pair, /* ... */ int64_t const * inds, /* ... */);
int read(int64_t num_pair, /* ... */);
char * read(char const * idx, /* ... */);
int read(int64_t num_pair, /* ... */);
int64_t get_tot_size(bool packed);
int allread(int64_t * num_pair, /* ... */);
int allread(int64_t * num_pair, /* ... */);
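A hedged sketch of how the bulk pair write/read declared above is normally driven from the typed CTF::Tensor wrapper, of which these untyped members are presumably the internal counterparts. The World and Tensor constructors, the NS symmetry constant, and the write/read signatures used here are assumed from CTF's public examples rather than taken from this header.

#include <ctf.hpp>
using namespace CTF;

int main(int argc, char ** argv){
  MPI_Init(&argc, &argv);
  {
    World dw(argc, argv);                 // distributed context (assumed constructor)
    int lens[2] = {4, 4};
    int syms[2] = {NS, NS};               // NS = nonsymmetric (assumed constant)
    Tensor<double> A(2, lens, syms, dw);

    // write() is collective: every rank passes a (possibly empty) list of
    // global-index/value pairs.
    if (dw.rank == 0){
      int64_t inds[2] = {0, 5};
      double  vals[2] = {1.0, 2.0};
      A.write(2, inds, vals);
    } else {
      A.write(0, NULL, NULL);
    }

    // read() is likewise collective and fills values for the requested indices.
    int64_t inds[2] = {0, 5};
    double  out[2]  = {0.0, 0.0};
    A.read(2, inds, out);
  }
  MPI_Finalize();
  return 0;
}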
void slice(int const * offsets_B, /* ... */ int const * offsets_A, /* ... */);
/* fragment of a longer declaration: ... int * const * permutation_A, ... int * const * permutation_B, ... */
int sparsify(char const * threshold=NULL, /* ... */);
int sparsify(std::function<bool(char const*)> f);
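The std::function overload of sparsify above takes a predicate over raw element bytes. A minimal sketch, assuming the tensor's algebraic structure stores doubles and that returning true means the element is retained:

#include <cmath>
#include <cstring>
#include <functional>

// Predicate for sparsify(std::function<bool(char const*)>): the argument points to
// one element in the algstrct's raw layout, decoded here as a double.
std::function<bool(char const *)> keep_large = [](char const * raw){
  double v;
  std::memcpy(&v, raw, sizeof(double));   // copy out to respect alignment/aliasing
  return std::fabs(v) > 1e-12;            // assumed: true => element is kept
};
// usage (t is a tensor*): t->sparsify(keep_large);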
int read_local(int64_t * num_pair, /* ... */ bool unpack_sym=false) const;
int read_local_nnz(int64_t * num_pair, /* ... */ bool unpack_sym=false) const;
void read_local(int64_t * num_pair, /* ... */ bool unpack_sym=false) const;
void read_local_nnz(int64_t * num_pair, /* ... */ bool unpack_sym=false) const;
int align(tensor const * B);
int reduce_sum(char * result);
int reduce_sum(char * result, algstrct const * sr_other);
int reduce_sumabs(char * result);
int reduce_sumabs(char * result, algstrct const * sr_other);
int reduce_sumsq(char * result);
int get_max_abs(int n, char * data) const;
void print(FILE * fp = stdout, char const * cutoff = NULL) const;
void compare(const tensor * A, FILE * fp, char const * cutoff);
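The reduce_* members above write their scalar result into a caller-supplied raw buffer. A hedged sketch of that calling pattern, assuming algstrct exposes an element size el_size and that the elements are doubles:

#include <cstring>
#include <vector>
// #include "untyped_tensor.h"   // internal header; the include path depends on the build tree

// Hedged sketch: t is a tensor*, and the buffer holds one element of t's algstrct.
double global_sum(tensor * t){
  std::vector<char> buf(t->sr->el_size);  // el_size assumed to exist on algstrct
  t->reduce_sum(buf.data());              // sums all elements across the tensor's world
  double s;
  std::memcpy(&s, buf.data(), sizeof(double));  // assumes a double-valued algstrct
  return s;
}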
void orient_subworld(CTF::World * greater_world, int & bw_mirror_rank, int & fw_mirror_rank, /* ... */ char ** sub_buffer_);
void add_to_subworld(tensor * tsr_sub, /* ... */);
void add_from_subworld(tensor * tsr_sub, /* ... */);
void unfold(bool was_mod=0);
double est_time_unfold();
/* fragment of a longer declaration: ... int const * fold_idx, ... */
void pull_alias(tensor const * other);
void clear_mapping();
/* fragment of a longer declaration: ... int const * old_offsets = NULL, int * const * old_permutation = NULL, int const * new_offsets = NULL, int * const * new_permutation = NULL); */
double est_redist_time(distribution const & old_dist, double nnz_frac);
int64_t get_redist_mem(distribution const & old_dist, double nnz_frac);
int map_tensor_rem(int num_phys_dims, /* ... */);
int extract_diag(int const * idx_map, /* ... */);
void set_sym(int const * sym);
void set_new_nnz_glb(int64_t const * nnz_blk);
void spmatricize(int m, int n, int nrow_idx, bool csr);
void despmatricize(int nrow_idx, bool csr);
void leave_home_with_buffer();
void register_size(int64_t size);
void deregister_size();
void write_dense_to_file(MPI_File & file, int64_t offset=0);
void write_dense_to_file(char const * filename);
void read_dense_from_file(MPI_File & file, int64_t offset=0);
void read_dense_from_file(char const * filename);
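A hedged sketch of driving the MPI-IO overload of write_dense_to_file declared above. The file-handling calls are standard MPI-IO; t is assumed to be a pointer to this internal tensor class.

#include <mpi.h>
// #include "untyped_tensor.h"   // internal header; the include path depends on the build tree

// Write the dense form of *t starting at byte offset 0 of a shared file.
void dump_dense(tensor * t, char const * path){
  MPI_File fh;
  MPI_File_open(MPI_COMM_WORLD, path,
                MPI_MODE_CREATE | MPI_MODE_WRONLY, MPI_INFO_NULL, &fh);
  t->write_dense_to_file(fh, 0);   // presumably collective over the tensor's world
  MPI_File_close(&fh);
}
// The filename overload, t->write_dense_to_file(path), presumably wraps the same steps.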
template <typename dtype_A, typename dtype_B> /* ... */
template <typename dtype_A, typename dtype_B> void exp_helper(tensor * A);
template <typename dtype> /* ... (several templated helper declarations not preserved in this listing) */
template <typename dtype> void true_divide(tensor * A);
tensor * self_reduce(int const * idx_A, /* ... */ int const * idx_C=NULL, int ** new_idx_C=NULL);

#endif // __UNTYPED_TENSOR_H__

void permute(int order, int const *perm, int *arr)
permute an array
char * home_buffer
buffer associated with home mapping of tensor, to which it is returned
bool is_home
whether the latest tensor data is in the home buffer
int64_t * nnz_blk
nonzero elements in each block owned locally
int * sym
symmetries among tensor dimensions
int * pad_edge_len
padded tensor edge lengths
int * inner_ordering
ordering of the dimensions according to which the tensor is folded
bool has_home
whether the tensor has a home mapping/buffer
int64_t size
current size of local tensor data chunk (mapping-dependent)
bool is_csr
whether CSR or COO if folded
bool is_folded
whether the data is folded/transposed into a (lower-order) tensor
int64_t home_size
size of home buffer
bool is_sparse
whether only the non-zero elements of the tensor are stored
int order
number of tensor dimensions
CTF::World * wrld
distributed processor context on which tensor is defined
int is_scp_padded
whether tensor data has additional padding
bool is_cyclic
whether the tensor data is cyclically distributed (blocked if false)
int * padding
padding along each edge length (less than distribution phase)
int * lens
unpadded tensor edge lengths
int nrow_idx
how many modes are folded into matricized row
bool is_data_aliased
whether the tensor data is an alias of another tensor object's data
int64_t nnz_tot
maximum number of local nonzero elements over all procs
algstrct * sr
algstrct on which tensor elements and operations are defined
mapping * edge_map
mappings of each tensor dimension onto topology dimensions
tensor * rec_tsr
representation of folded tensor (shares data pointer)
bool left_home_transp
whether the tensor left home to transpose
bool is_mapped
whether a mapping has been selected
int64_t registered_alloc_size
size CTF keeps track of for memory usage
int * sym_table
order-by-order table of dimensional symmetry relations
int * scp_padding
additional padding, may be greater than ScaLAPACK phase
int64_t nnz_loc
number of local nonzero elements
bool profile
whether profiling should be done for contractions/sums involving this tensor
char * data
tensor data, either the data or the key-value pairs should exist at any given time ...
topology * topo
topology to which the tensor is mapped
bool has_zero_edge_len
if true, the tensor has a zero edge length and is therefore identically zero, which lets many operations short-circuit
tensor * slay
tensor object associated with this tensor whose data pointer needs to be preserved; needed for the ScaLAPACK wrapper. FIXME: the home buffer should presumably take care of this
char * name
name given to tensor
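To tie together the sparse bookkeeping fields above, a toy illustration (not CTF code): nnz_blk holds one nonzero count per locally owned virtual block, and nnz_loc is assumed to be their sum, with the block count corresponding to the value returned by calc_nvirt().

#include <cstdint>

// Hypothetical helper: recompute the local nonzero count from per-block counts.
int64_t sum_block_nnz(int64_t const * nnz_blk, int64_t nvirt){
  int64_t nnz_loc = 0;
  for (int64_t b = 0; b < nvirt; b++)
    nnz_loc += nnz_blk[b];   // per-block nonzero counts
  return nnz_loc;
}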