ctf/sym__seq__scl_8cxx_source.html

 /*Copyright (c) 2011, Edgar Solomonik, all rights reserved.*/

 #include "../shared/iter_tsr.h"
 #include "../shared/util.h"
 #include <limits.h>
 #include "sym_seq_scl.h"
 #include "scaling.h"
 #include "../interface/idx_tensor.h"

 namespace CTF_int {

   /**
    * \brief apply f to A
    * \param[in] A term that is executed over its unique indices; the resulting
    *              indexed tensor is then handed to a scaling object together with
    *              this endomorphism
    */
   void endomorphism::operator()(Term const & A) const {
     // evaluate the term over the list of unique indices it reports
     CTF::Idx_Tensor evaluated = A.execute(A.get_uniq_inds());
     // build the scaling from the evaluated tensor's parent, index map and scale,
     // passing this endomorphism as the last argument, and run it immediately
     scaling(evaluated.parent, evaluated.idx_map, evaluated.scale, this).execute();
   }


   /**
    * \brief invert index map
    * \param[in] order_A number of entries in idx_A
    * \param[in] idx_A index label carried by each position of A
    * \param[out] order_tot set to (largest label in idx_A)+1, or 0 when idx_A
    *                       holds no non-negative label
    * \param[out] idx_arr set to an array of *order_tot ints obtained from
    *                     CTF_int::alloc; entry l is the last position i with
    *                     idx_A[i]==l, or -1 if no position carries label l.
    *                     This function does not free the array.
    */
   void inv_idx(int const   order_A,
                int const * idx_A,
                int *       order_tot,
                int **      idx_arr){
     // one slot is needed for every label value in [0, largest label]
     int num_labels = 0;
     for (int pos=0; pos<order_A; pos++){
       if (idx_A[pos] >= num_labels) num_labels = idx_A[pos]+1;
     }
     *order_tot = num_labels;

     int * inverse = (int*)CTF_int::alloc(sizeof(int)*num_labels);
     *idx_arr = inverse;
     // -1 marks labels that no position of A uses
     std::fill(inverse, inverse+num_labels, -1);

     // when a label repeats, the later position overwrites the earlier one
     for (int pos=0; pos<order_A; pos++){
       inverse[idx_A[pos]] = pos;
     }
   }


   /**
    * \brief performs symmetric scaling using algstrct const * sr_A
    *
    * Steps a multi-index (one counter per distinct label of idx_map_A) through
    * its range and, for every position at which sym_pass is set, overwrites the
    * element at offset idx_A with the result of sr_A->mul(element, alpha).
    *
    * \param[in] alpha scaling factor handed to sr_A->mul for each visited element;
    *                  it is passed unconditionally (no NULL check here)
    * \param[in,out] A tensor data, addressed in strides of sr_A->el_size bytes
    * \param[in] sr_A algebraic structure providing mul() and el_size
    * \param[in] order_A number of entries in edge_len_A and idx_map_A
    * \param[in] edge_len_A edge lengths of A (order_A entries are copied locally)
    * \param[in] sym_A symmetry description of A; not referenced directly in this
    *                  body, presumably consumed by the iteration macros
    * \param[in] idx_map_A index label of each mode of A
    * \return always 0
    */
   int sym_seq_scl_ref(char const *     alpha,
                       char *           A,
                       algstrct const * sr_A,
                       int              order_A,
                       int const *      edge_len_A,
                       int const *      sym_A,
                       int const *      idx_map_A){
     // the profiling region carries this function's own name so its time is not
     // attributed to the summation kernel sym_seq_sum_ref
     TAU_FSTART(sym_seq_scl_ref);
     // NOTE(review): several of these locals are not referenced by name below;
     // they are presumably used inside GET_MIN_MAX / CHECK_SYM / RESET_IDX, so
     // their names must stay exactly as they are -- confirm against iter_tsr.h
     int idx, i, idx_max, imin, imax, iA, j, k;
     int off_idx, sym_pass;
     int * idx_glb, * rev_idx_map;
     int * dlen_A;
     int64_t idx_A, off_lda;

     // idx_max = number of distinct index labels, rev_idx_map = label -> mode of A
     inv_idx(order_A,       idx_map_A,
             &idx_max,     &rev_idx_map);

     // private copy of the edge lengths
     dlen_A = (int*)CTF_int::alloc(sizeof(int)*order_A);
     memcpy(dlen_A, edge_len_A, sizeof(int)*order_A);

     // current value of every index label, all starting at zero
     idx_glb = (int*)CTF_int::alloc(sizeof(int)*idx_max);
     memset(idx_glb, 0, sizeof(int)*idx_max);


     idx_A = 0;
     sym_pass = 1;
     for (;;){
       if (sym_pass){
         //A[idx_A] = alpha*A[idx_A];
         sr_A->mul(A+idx_A*sr_A->el_size, alpha, A+idx_A*sr_A->el_size);
         CTF_FLOPS_ADD(1);
       }

       // advance the multi-index like an odometer: bump the first label, and
       // carry into the next one whenever a label wraps back to its minimum
       for (idx=0; idx<idx_max; idx++){
         imin = 0, imax = INT_MAX;

         // presumably narrows [imin,imax) for label idx from A's edge lengths
         // and symmetry -- see iter_tsr.h
         GET_MIN_MAX(A,0,1);

         ASSERT(idx_glb[idx] >= imin && idx_glb[idx] < imax);

         idx_glb[idx]++;

         if (idx_glb[idx] >= imax){
           idx_glb[idx] = imin;
         }
         if (idx_glb[idx] != imin) {
           break;
         }
       }
       // every label wrapped around: the whole range has been visited
       if (idx == idx_max) break;

       // presumably updates sym_pass for the new multi-index -- see iter_tsr.h
       CHECK_SYM(A);
       if (!sym_pass) continue;

       // presumably recomputes the linear offset idx_A from idx_glb -- see iter_tsr.h
       if (order_A > 0)
         RESET_IDX(A);
     }
     CTF_int::cdealloc(dlen_A);
     CTF_int::cdealloc(idx_glb);
     CTF_int::cdealloc(rev_idx_map);
     TAU_FSTOP(sym_seq_scl_ref);
     return 0;
   }


   /**
    * \brief performs symmetric scaling using custom func
    *
    * Steps a multi-index (one counter per distinct label of idx_map_A) through
    * its range and, for every position at which sym_pass is set, first scales
    * the element at offset idx_A by alpha via sr_A->mul (skipped when alpha is
    * NULL) and then calls func->apply_f on that element.
    *
    * \param[in] alpha scaling factor applied before func, or NULL to skip the
    *                  multiplication
    * \param[in,out] A tensor data, addressed in strides of sr_A->el_size bytes
    * \param[in] sr_A algebraic structure providing mul() and el_size
    * \param[in] order_A number of entries in edge_len_A and idx_map_A
    * \param[in] edge_len_A edge lengths of A (order_A entries are copied locally)
    * \param[in] sym_A symmetry description of A; not referenced directly in this
    *                  body, presumably consumed by the iteration macros
    * \param[in] idx_map_A index label of each mode of A
    * \param[in] func function whose apply_f is invoked on each visited element;
    *                 dereferenced unconditionally
    * \return always 0
    */
   int sym_seq_scl_cust(char const *         alpha,
                        char *               A,
                        algstrct const *     sr_A,
                        int const            order_A,
                        int const *          edge_len_A,
                        int const *          sym_A,
                        int const *          idx_map_A,
                        endomorphism const * func){
     // the profiling region carries this function's own name so its time is not
     // attributed to the summation kernel sym_seq_sum_cust
     TAU_FSTART(sym_seq_scl_cust);
     // NOTE(review): several of these locals are not referenced by name below;
     // they are presumably used inside GET_MIN_MAX / CHECK_SYM / RESET_IDX, so
     // their names must stay exactly as they are -- confirm against iter_tsr.h
     int idx, i, idx_max, imin, imax, iA, j, k;
     int off_idx, sym_pass;
     int * idx_glb, * rev_idx_map;
     int * dlen_A;
     int64_t idx_A, off_lda;

     // idx_max = number of distinct index labels, rev_idx_map = label -> mode of A
     inv_idx(order_A,       idx_map_A,
             &idx_max,     &rev_idx_map);

     // private copy of the edge lengths
     dlen_A = (int*)CTF_int::alloc(sizeof(int)*order_A);
     memcpy(dlen_A, edge_len_A, sizeof(int)*order_A);

     // current value of every index label, all starting at zero
     idx_glb = (int*)CTF_int::alloc(sizeof(int)*idx_max);
     memset(idx_glb, 0, sizeof(int)*idx_max);


     idx_A = 0;
     sym_pass = 1;
     for (;;){
       if (sym_pass){
         // optional pre-scaling by alpha, then the custom elementwise function
         if (alpha != NULL)
           sr_A->mul(A+idx_A*sr_A->el_size, alpha, A+idx_A*sr_A->el_size);
         func->apply_f(A+idx_A*sr_A->el_size);
         CTF_FLOPS_ADD(1);
       }

       // advance the multi-index like an odometer: bump the first label, and
       // carry into the next one whenever a label wraps back to its minimum
       for (idx=0; idx<idx_max; idx++){
         imin = 0, imax = INT_MAX;

         // presumably narrows [imin,imax) for label idx from A's edge lengths
         // and symmetry -- see iter_tsr.h
         GET_MIN_MAX(A,0,1);

         ASSERT(idx_glb[idx] >= imin && idx_glb[idx] < imax);

         idx_glb[idx]++;

         if (idx_glb[idx] >= imax){
           idx_glb[idx] = imin;
         }
         if (idx_glb[idx] != imin) {
           break;
         }
       }
       // every label wrapped around: the whole range has been visited
       if (idx == idx_max) break;

       // presumably updates sym_pass for the new multi-index -- see iter_tsr.h
       CHECK_SYM(A);
       if (!sym_pass) continue;

       // presumably recomputes the linear offset idx_A from idx_glb -- see iter_tsr.h
       if (order_A > 0)
         RESET_IDX(A);
     }
     CTF_int::cdealloc(dlen_A);
     CTF_int::cdealloc(idx_glb);
     CTF_int::cdealloc(rev_idx_map);
     TAU_FSTOP(sym_seq_scl_cust);
     return 0;
   }


 }
CTF_int::Term
a term is an abstract object representing some expression of tensors
Definition: term.h:33

scaling.h

CTF_int::Term::execute
virtual void execute(CTF::Idx_Tensor output) const  =0
evaluates the expression, which just scales by default

CTF_int::endomorphism
untyped internal class for singly-typed single variable function (Endomorphism)
Definition: sym_seq_scl.h:12

RESET_IDX
#define RESET_IDX(__X)
Definition: iter_tsr.h:67

CTF_int::sym_seq_sum_ref
int sym_seq_sum_ref(char const *alpha, char const *A, algstrct const *sr_A, int order_A, int const *edge_len_A, int const *sym_A, int const *idx_map_A, char const *beta, char *B, algstrct const *sr_B, int order_B, int const *edge_len_B, int const *sym_B, int const *idx_map_B)
performs symmetric summation with unblocked reference kernel
Definition: sym_seq_sum.cxx:292

CTF::Idx_Tensor::idx_map
char * idx_map
Definition: idx_tensor.h:18

CTF_int::inv_idx
void inv_idx(int order_A, int const *idx_A, int order_B, int const *idx_B, int order_C, int const *idx_C, int *order_tot, int **idx_arr)
invert index map
Definition: ctr_tsr.cxx:592

ASSERT
#define ASSERT(...)
Definition: util.h:88

CTF_int::alloc
void * alloc(int64_t len)
alloc abstraction
Definition: memcontrol.cxx:365

GET_MIN_MAX
#define GET_MIN_MAX(__X, nr, wd)
Definition: iter_tsr.h:16

CTF_FLOPS_ADD
#define CTF_FLOPS_ADD(n)
Definition: util.h:138

CTF_int::endomorphism::apply_f
virtual void apply_f(char *a) const
apply function f to value stored at a
Definition: sym_seq_scl.h:19

CTF_int::scaling
class for execution distributed scaling of a tensor
Definition: scaling.h:14

CTF_int::sym_seq_scl_ref
int sym_seq_scl_ref(char const *alpha, char *A, algstrct const *sr_A, int order_A, int const *edge_len_A, int const *sym_A, int const *idx_map_A)
performs symmetric scaling using algstrct const * sr_A
Definition: sym_seq_scl.cxx:40

TAU_FSTOP
#define TAU_FSTOP(ARG)
Definition: util.h:281

CTF_int::sym_seq_scl_cust
int sym_seq_scl_cust(char const *alpha, char *A, algstrct const *sr_A, int const order_A, int const *edge_len_A, int const *sym_A, int const *idx_map_A, endomorphism const *func)
performs symmetric scaling using custom func
Definition: sym_seq_scl.cxx:105

TAU_FSTART
#define TAU_FSTART(ARG)
Definition: util.h:280

CHECK_SYM
#define CHECK_SYM(__X)
Definition: iter_tsr.h:52

CTF_int::Term::get_uniq_inds
virtual std::vector< char > get_uniq_inds() const  =0
find list of unique indices that are involved in this term

CTF_int::sym_seq_sum_cust
int sym_seq_sum_cust(char const *alpha, char const *A, algstrct const *sr_A, int order_A, int const *edge_len_A, int const *sym_A, int const *idx_map_A, char const *beta, char *B, algstrct const *sr_B, int order_B, int const *edge_len_B, int const *sym_B, int const *idx_map_B, univar_function const *func)
performs symmetric summation with custom elementwise function
Definition: sym_seq_sum.cxx:524

CTF_int::accumulatable::el_size
int el_size
size of each element of algstrct in bytes
Definition: algstrct.h:16

CTF_int::cdealloc
int cdealloc(void *ptr)
free abstraction
Definition: memcontrol.cxx:480

sym_seq_scl.h

CTF_int::algstrct
algstrct (algebraic structure) defines the elementwise operations computed in each tensor contraction...
Definition: algstrct.h:34

CTF_int::scaling::execute
int execute()
run scaling
Definition: scaling.cxx:64

CTF_int::Term::scale
char * scale
Definition: term.h:35

CTF_int::endomorphism::operator()
void operator()(Term const &A) const
apply f to A
Definition: sym_seq_scl.cxx:12

CTF_int::algstrct::mul
virtual void mul(char const *a, char const *b, char *c) const
c = a*b
Definition: algstrct.cxx:120

CTF_int
Definition: model_trainer.cxx:16

CTF::Idx_Tensor
a tensor with an index map associated with it (necessary for overloaded operators) ...
Definition: idx_tensor.h:15

CTF::Idx_Tensor::parent
CTF_int::tensor * parent
Definition: idx_tensor.h:17