Grid/dev/Tensor__arith__mac_8h_source.html

/*************************************************************************************


    Grid physics library, www.github.com/paboyle/Grid


    Source file: ./lib/tensors/Tensor_arith_mac.h


    Copyright (C) 2015


Author: Peter Boyle <paboyle@ph.ed.ac.uk>


    This program is free software; you can redistribute it and/or modify

    it under the terms of the GNU General Public License as published by

    the Free Software Foundation; either version 2 of the License, or

    (at your option) any later version.


    This program is distributed in the hope that it will be useful,

    but WITHOUT ANY WARRANTY; without even the implied warranty of

    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

    GNU General Public License for more details.


    You should have received a copy of the GNU General Public License along

    with this program; if not, write to the Free Software Foundation, Inc.,

    51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.


    See the full license in the file "LICENSE" in the top level distribution directory

*************************************************************************************/

/*  END LEGAL */

#ifndef GRID_MATH_ARITH_MAC_H

#define GRID_MATH_ARITH_MAC_H


NAMESPACE_BEGIN(Grid);


// Legal multiplication table

// scal x scal = scal

// mat x  mat  = mat

// mat  x scal = mat

// scal x mat  = mat

// mat  x vec  = vec

// vec  x scal = vec

// scal x vec  = vec

// scal x scal = scal
// Unwraps one iScalar level from each operand and forwards to the mac
// overload selected for the wrapped types. The innermost (element-level)
// mac is not defined in this header; presumably it performs
// ret += lhs * rhs -- confirm against the underlying type's definition.
template<class rtype,class vtype,class mtype>
accelerator_inline void mac(iScalar<rtype> * __restrict__ ret,
                            const iScalar<vtype> * __restrict__ lhs,
                            const iScalar<mtype> * __restrict__ rhs)
{
  mac(&ret->_internal, &lhs->_internal, &rhs->_internal);
}


// mat x mat = mat
// For every (row, col) pair, calls the nested mac on ret[row][col] with
// lhs[row][k] and rhs[k][col], for k = 0..N-1. The contraction index k is
// the outermost loop, so each ret element is visited once per k in
// ascending k order.
template<class rrtype,class ltype,class rtype,int N>
accelerator_inline void mac(iMatrix<rrtype,N> * __restrict__ ret,
                            const iMatrix<ltype,N> * __restrict__ lhs,
                            const iMatrix<rtype,N> * __restrict__ rhs)
{
  for (int k = 0; k < N; ++k) {
    for (int row = 0; row < N; ++row) {
      for (int col = 0; col < N; ++col) {
        mac(&ret->_internal[row][col],
            &lhs->_internal[row][k],
            &rhs->_internal[k][col]);
      }
    }
  }
}


// mat x scal = mat
// Applies the nested mac element by element: ret[row][col] is combined with
// lhs[row][col] and the single value wrapped by the scalar rhs.
template<class rrtype,class ltype,class rtype,int N>
accelerator_inline void mac(iMatrix<rrtype,N> * __restrict__ ret,
                            const iMatrix<ltype,N> * __restrict__ lhs,
                            const iScalar<rtype> * __restrict__ rhs)
{
  for (int row = 0; row < N; ++row) {
    for (int col = 0; col < N; ++col) {
      mac(&ret->_internal[row][col],
          &lhs->_internal[row][col],
          &rhs->_internal);
    }
  }
}


// scal x mat = mat
// Applies the nested mac element by element: ret[row][col] is combined with
// the single value wrapped by the scalar lhs and rhs[row][col]. The scalar
// stays on the left-hand side of every nested call.
template<class rrtype,class ltype,class rtype,int N>
accelerator_inline void mac(iMatrix<rrtype,N> * __restrict__ ret,
                            const iScalar<ltype> * __restrict__ lhs,
                            const iMatrix<rtype,N> * __restrict__ rhs)
{
  for (int row = 0; row < N; ++row) {
    for (int col = 0; col < N; ++col) {
      mac(&ret->_internal[row][col],
          &lhs->_internal,
          &rhs->_internal[row][col]);
    }
  }
}


// mat x vec = vec
// For each output component ret[row], calls the nested mac with
// lhs[row][col] and rhs[col] for col = 0..N-1, in ascending col order.
template<class rrtype,class ltype,class rtype,int N>
accelerator_inline void mac(iVector<rrtype,N> * __restrict__ ret,
                            const iMatrix<ltype,N> * __restrict__ lhs,
                            const iVector<rtype,N> * __restrict__ rhs)
{
  for (int row = 0; row < N; ++row) {
    for (int col = 0; col < N; ++col) {
      mac(&ret->_internal[row],
          &lhs->_internal[row][col],
          &rhs->_internal[col]);
    }
  }
}


// scal x vec = vec
// Applies the nested mac component by component: ret[idx] is combined with
// the single value wrapped by the scalar lhs and rhs[idx].
template<class rrtype,class ltype,class rtype,int N>
accelerator_inline void mac(iVector<rrtype,N> * __restrict__ ret,
                            const iScalar<ltype> * __restrict__ lhs,
                            const iVector<rtype,N> * __restrict__ rhs)
{
  for (int idx = 0; idx < N; ++idx) {
    mac(&ret->_internal[idx], &lhs->_internal, &rhs->_internal[idx]);
  }
}


// vec x scal = vec
// Applies the nested mac component by component: ret[idx] is combined with
// lhs[idx] and the single value wrapped by the scalar rhs.
template<class rrtype,class ltype,class rtype,int N>
accelerator_inline void mac(iVector<rrtype,N> * __restrict__ ret,
                            const iVector<ltype,N> * __restrict__ lhs,
                            const iScalar<rtype> * __restrict__ rhs)
{
  for (int idx = 0; idx < N; ++idx) {
    mac(&ret->_internal[idx], &lhs->_internal[idx], &rhs->_internal);
  }
}


NAMESPACE_END(Grid);


#endif

accelerator_inline
#define accelerator_inline
Definition Accelerator.h:608

NAMESPACE_BEGIN
#define NAMESPACE_BEGIN(A)
Definition Namespace.h:35

NAMESPACE_END
#define NAMESPACE_END(A)
Definition Namespace.h:36

mac
accelerator_inline void mac(iScalar< rtype > *__restrict__ ret, const iScalar< vtype > *__restrict__ lhs, const iScalar< mtype > *__restrict__ rhs)
Definition Tensor_arith_mac.h:50

iMatrix
Definition Tensor_class.h:301

iMatrix::_internal
vtype _internal[N][N]
Definition Tensor_class.h:303

iScalar
Definition Tensor_class.h:77

iScalar::_internal
vtype _internal
Definition Tensor_class.h:79

iVector
Definition Tensor_class.h:189

iVector::_internal
vtype _internal[N]
Definition Tensor_class.h:191

Grid
Definition Deflation.h:31