doc/html/Stokhos__LinearSparse3Tensor_8hpp_source.html

 // @HEADER

 // ***********************************************************************

 //

 //                           Stokhos Package

 //                 Copyright (2009) Sandia Corporation

 //

 // Under terms of Contract DE-AC04-94AL85000, there is a non-exclusive

 // license for use of this work by or on behalf of the U.S. Government.

 //

 // Redistribution and use in source and binary forms, with or without

 // modification, are permitted provided that the following conditions are

 // met:

 //

 // 1. Redistributions of source code must retain the above copyright

 // notice, this list of conditions and the following disclaimer.

 //

 // 2. Redistributions in binary form must reproduce the above copyright

 // notice, this list of conditions and the following disclaimer in the

 // documentation and/or other materials provided with the distribution.

 //

 // 3. Neither the name of the Corporation nor the names of the

 // contributors may be used to endorse or promote products derived from

 // this software without specific prior written permission.

 //

 // THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY

 // EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE

 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR

 // PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE

 // CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,

 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,

 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR

 // PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF

 // LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING

 // NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS

 // SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 //

 // Questions? Contact Eric T. Phipps (etphipp@sandia.gov).

 //

 // ***********************************************************************

 // @HEADER


 #ifndef STOKHOS_LINEAR_SPARSE_3_TENSOR_HPP

 #define STOKHOS_LINEAR_SPARSE_3_TENSOR_HPP


 #include "Kokkos_Core.hpp"


 #include "Stokhos_Multiply.hpp"

 #include "Stokhos_ProductBasis.hpp"

 #include "Stokhos_Sparse3Tensor.hpp"

 #include "Teuchos_ParameterList.hpp"

 #include "Stokhos_TinyVec.hpp"


 //----------------------------------------------------------------------------

 //----------------------------------------------------------------------------


 namespace Stokhos {


 /// Triple-product tensor that stores only a handful of coefficients.
 ///
 /// create() fills the value array with entries (0,0,0) and (0,1,1) of the
 /// triple-product tensor of the first coordinate basis, plus entry (1,1,1)
 /// when the "Symmetric" parameter is false.  Two or three values are
 /// therefore kept regardless of the basis size.
 ///
 /// \tparam ValueType       Scalar type of the stored coefficients.
 /// \tparam ExecutionSpace  Kokkos execution space; supplies size_type and
 ///                         parameterizes the Kokkos::View holding the values.
 /// \tparam BlockSize       Granularity used to round up aligned_dimension().
 template< typename ValueType , class ExecutionSpace , int BlockSize >
 class LinearSparse3Tensor {
 public:

   using execution_space = ExecutionSpace ;
   using size_type       = typename execution_space::size_type ;
   using value_type      = ValueType ;

   /// Compile-time copy of the BlockSize template argument.
   static const int block_size = BlockSize;

 private:

   using value_array_type = Kokkos::View< value_type[], execution_space > ;

   value_array_type   m_value ;        ///< Stored coefficients (m_nnz of them).
   size_type          m_dim ;          ///< basis.size() at creation time.
   size_type          m_aligned_dim ;  ///< m_dim rounded up to a multiple of block_size.
   size_type          m_nnz ;          ///< 2 when symmetric, 3 otherwise.
   size_type          m_flops ;        ///< Flop estimate computed in create().
   bool               m_symmetric ;    ///< Value of the "Symmetric" parameter.

 public:

   inline ~LinearSparse3Tensor() {}

   /// Construct an empty tensor: default view, zero sizes, not symmetric.
   inline LinearSparse3Tensor()
     : m_value()
     , m_dim()
     , m_aligned_dim()
     , m_nnz(0)
     , m_flops(0)
     , m_symmetric(false)
   {}

   /// Member-wise copy; the value view is copied as a Kokkos::View handle.
   inline LinearSparse3Tensor( const LinearSparse3Tensor & rhs )
     : m_value( rhs.m_value )
     , m_dim( rhs.m_dim )
     , m_aligned_dim( rhs.m_aligned_dim )
     , m_nnz( rhs.m_nnz )
     , m_flops( rhs.m_flops )
     , m_symmetric( rhs.m_symmetric )
   {}

   /// Member-wise assignment, mirroring the copy constructor.
   inline LinearSparse3Tensor & operator = ( const LinearSparse3Tensor & rhs )
   {
     m_value       = rhs.m_value ;
     m_dim         = rhs.m_dim ;
     m_aligned_dim = rhs.m_aligned_dim ;
     m_nnz         = rhs.m_nnz ;
     m_flops       = rhs.m_flops ;
     m_symmetric   = rhs.m_symmetric ;
     return *this ;
   }

   /// Dimension of the tensor (the basis size passed to create()).
   KOKKOS_INLINE_FUNCTION
   size_type dimension() const
   {
     return m_dim ;
   }

   /// Dimension rounded up to the next multiple of block_size.
   KOKKOS_INLINE_FUNCTION
   size_type aligned_dimension() const
   {
     return m_aligned_dim ;
   }

   /// Number of stored entries, i.e. the extent of the value view.
   KOKKOS_INLINE_FUNCTION
   size_type entry_count() const
   {
     return m_value.extent(0) ;
   }

   /// Whether the tensor was created with "Symmetric" set to true.
   KOKKOS_INLINE_FUNCTION
   bool symmetric() const
   {
     return m_symmetric ;
   }

   /// Stored coefficient number \c entry (no bounds check is done here).
   KOKKOS_INLINE_FUNCTION
   const value_type & value( const size_type entry ) const
   {
     return m_value( entry ) ;
   }

   /// Number of non-zeros recorded by create().
   KOKKOS_INLINE_FUNCTION
   size_type num_non_zeros() const
   {
     return m_nnz ;
   }

   /// Flop count recorded by create().
   KOKKOS_INLINE_FUNCTION
   size_type num_flops() const
   {
     return m_flops ;
   }

   /// Build a tensor from a product basis.
   ///
   /// \param basis   Product basis; its size() becomes dimension() and its
   ///                first coordinate basis supplies the coefficients.
   /// \param Cijk    Not read by this implementation.
   /// \param params  Must hold a bool entry named "Symmetric".
   /// \return The populated tensor, with its values copied to the device view.
   template <typename OrdinalType>
   static LinearSparse3Tensor
   create( const Stokhos::ProductBasis<OrdinalType,ValueType>& basis,
           const Stokhos::Sparse3Tensor<OrdinalType,ValueType>& Cijk,
           const Teuchos::ParameterList& params)
   {
     using basis_1d_type   = Stokhos::OneDOrthogPolyBasis<OrdinalType,ValueType> ;
     using dense_cijk_type = Stokhos::Dense3Tensor<OrdinalType,ValueType> ;
     using host_array_type = typename value_array_type::HostMirror ;

     const bool is_symmetric = params.get<bool>("Symmetric");

     // Size bookkeeping -- the basis is currently assumed to be isotropic.
     const size_type n = basis.size();
     LinearSparse3Tensor result ;
     result.m_dim = n;

     // Round n up to the next multiple of block_size (unchanged if already one).
     const size_type remainder = n % block_size;
     result.m_aligned_dim = remainder ? n + (block_size - remainder) : n;

     result.m_symmetric = is_symmetric;
     result.m_nnz = is_symmetric ? 2 : 3 ;
     result.m_value = value_array_type( "value" , result.m_nnz );

     // Host-side staging buffer; it is a plain view when the memory is host memory.
     host_array_type host_coeffs = Kokkos::create_mirror_view( result.m_value );

     // Triple products of the first coordinate basis.  A non-isotropic basis
     // would need products of these over all basis components.
     Teuchos::Array< Teuchos::RCP<const basis_1d_type> > coord_bases =
       basis.getCoordinateBases();
     Teuchos::RCP<dense_cijk_type> cijk_1d =
       coord_bases[0]->computeTripleProductTensor();

     host_coeffs(0) = (*cijk_1d)(0,0,0);
     host_coeffs(1) = (*cijk_1d)(0,1,1);
     if (!is_symmetric) {
       host_coeffs(2) = (*cijk_1d)(1,1,1);
     }

     // Push the staged coefficients to the device when that is a separate space.
     Kokkos::deep_copy( result.m_value , host_coeffs );

     // 8 flops per entry, plus 2 more per entry for the non-symmetric term.
     result.m_flops = is_symmetric ? 8*n : 8*n + 2*n ;

     return result ;
   }
 };


 /// Free-function front end for LinearSparse3Tensor::create().
 ///
 /// All arguments are forwarded unchanged.  BlockSize does not appear in the
 /// function parameters, so callers have to name the template arguments
 /// explicitly.
 ///
 /// \param basis   Product basis handed to create().
 /// \param Cijk    Sparse triple-product tensor handed to create().
 /// \param params  Parameter list handed to create().
 /// \return The tensor produced by LinearSparse3Tensor::create().
 template< class Device , typename OrdinalType , typename ValueType , int BlockSize >
 LinearSparse3Tensor<ValueType, Device,BlockSize>
 create_linear_sparse_3_tensor(
   const Stokhos::ProductBasis<OrdinalType,ValueType>& basis,
   const Stokhos::Sparse3Tensor<OrdinalType,ValueType>& Cijk,
   const Teuchos::ParameterList& params)
 {
   typedef LinearSparse3Tensor<ValueType, Device, BlockSize> result_tensor_type ;
   return result_tensor_type::create( basis, Cijk, params );
 }


 /// BlockMultiply specialization for LinearSparse3Tensor.
 ///
 /// With c0, c1, c2 = tensor.value(0), value(1), value(2) and
 /// dim = tensor.dimension(), apply() accumulates into y:
 ///
 ///   y[0] += c0*a[0]*x[0] + c1 * sum_{i=1..dim-1} a[i]*x[i]
 ///   y[i] += c1*(a[0]*x[i] + a[i]*x[0])              (symmetric tensor)
 ///   y[i] += c1*(a[0]*x[i] + a[i]*x[0]) + c2*a[i]*x[i]   (otherwise)
 ///
 /// for i = 1..dim-1.  c2 is only read when the tensor is not symmetric.
 template < typename ValueType, typename Device, int BlockSize >

 class BlockMultiply< LinearSparse3Tensor< ValueType , Device , BlockSize > >

 {

 public:


   typedef typename Device::size_type size_type ;

   typedef LinearSparse3Tensor< ValueType , Device , BlockSize > tensor_type ;


   /// Accumulate the tensor-weighted product of a and x into y.
   ///
   /// \param tensor  Supplies the coefficients, dimension and symmetry flag.
   /// \param a       Matrix-side coefficients; indices 0..dim-1 are read.
   /// \param x       Input vector coefficients; indices 0..dim-1 are read.
   /// \param y       Output vector coefficients; indices 0..dim-1 are
   ///                updated in place (+=), never overwritten.
   ///
   /// a[0], x[0] and tensor.value(0..1) are read unconditionally.
   /// NOTE(review): the blocked path uses aligned_load/aligned_scatter on
   /// a, x and y -- presumably these require suitably aligned pointers;
   /// confirm against Stokhos_TinyVec.hpp.
   template< typename MatrixValue , typename VectorValue >

   KOKKOS_INLINE_FUNCTION

   static void apply( const tensor_type & tensor ,

                      const MatrixValue * const a ,

                      const VectorValue * const x ,

                            VectorValue * const y )

   {

     const size_type block_size = tensor_type::block_size;

     typedef TinyVec<ValueType,block_size,true> TV;

     const size_type dim = tensor.dimension();


     const ValueType c0 = tensor.value(0);

     const ValueType c1 = tensor.value(1);

     const ValueType a0 = a[0];

     const ValueType x0 = x[0];


     // Blocked path: process block_size entries at a time with TinyVec, then
     // finish the tail with a scalar loop.
     if (block_size > 1) {


       // Scalars broadcast into TinyVec form; vy0 accumulates the y[0] sum.
       // NOTE(review): vc0 is constructed but not referenced again in this
       // function.
       TV vc0(c0), vc1(c1), va0(a0), vx0(x0), vy0;

       TV ai, ai2, xi, yi;


       // Running cursors into a, x and y, advanced by both loops below.
       const MatrixValue *aa = a;

       const VectorValue *xx = x;

       VectorValue *yy = y;

       vy0.zero();


       // iEnd is dim rounded down to a multiple of block_size.
       const size_type nBlock = dim / block_size;

       const size_type iEnd = nBlock * block_size;


       if (tensor.symmetric()) {


         // Note the loop starts at i = 0, so index 0 is treated like every
         // other entry here; the final y[0] update below corrects for that.
         size_type i=0;

         for ( ; i < iEnd; i+=block_size,aa+=block_size,xx+=block_size,yy+=block_size) {

           ai.aligned_load(aa);

           // Second copy of the a-block, kept for the a[i]*x[i] product.
           ai2 = ai;

           xi.aligned_load(xx);

           yi.aligned_load(yy);


           // y[i] += c1*(a0*xi + ai*x0);

           ai.times_equal(vx0);

           ai2.times_equal(xi);

           xi.times_equal(va0);

           xi.plus_equal(ai);

           xi.times_equal(vc1);

           yi.plus_equal(xi);

           yi.aligned_scatter(yy);


           // y0  += c1*ai*xi;

           ai2.times_equal(vc1);

           vy0.plus_equal(ai2);

         }

         // Collapse the per-lane partial sums into one scalar.
         ValueType y0 = vy0.sum();


         // Do remaining entries with a scalar loop

         for ( ; i < dim; ++i) {

           const ValueType ai = *aa++;

           const ValueType xi = *xx++;

           *yy++ += c1*(a0*xi + ai*x0);

           y0  += c1*ai*xi;

         }

         // Index 0 went through the loops above, so y[0] already received
         // 2*c1*a0*x0 and y0 holds an extra c1*a0*x0.  Removing 3*c1*a0*x0
         // and adding c0*a0*x0 yields the same y[0] update as the scalar path.
         // NOTE(review): 3.0 is a double literal, so this term is evaluated
         // in double when ValueType is float.
         y[0] += y0 + (c0-3.0*c1)*a0*x0;

       }

       else {


         // Non-symmetric tensors carry a third coefficient.
         const ValueType c2 = tensor.value(2);

         TV vc2(c2);

         // As in the symmetric branch, the loop deliberately starts at i = 0.
         size_type i=0;

         for ( ; i < iEnd; i+=block_size,aa+=block_size,xx+=block_size,yy+=block_size) {

           ai.aligned_load(aa);

           ai2 = ai;

           xi.aligned_load(xx);

           yi.aligned_load(yy);


           // y[i] += c1*(a0*xi + ai*x0) + c2*aixi;

           ai.times_equal(vx0);

           ai2.times_equal(xi);

           xi.times_equal(va0);

           xi.plus_equal(ai);

           xi.times_equal(vc1);

           yi.plus_equal(xi);

           // ai is reused as scratch for c2*a[i]*x[i]; ai2 keeps a[i]*x[i].
           ai = ai2;

           ai.times_equal(vc2);

           yi.plus_equal(ai);

           yi.aligned_scatter(yy);


           // y0  += c1*aixi;

           ai2.times_equal(vc1);

           vy0.plus_equal(ai2);

         }

         // Collapse the per-lane partial sums into one scalar.
         ValueType y0 = vy0.sum();


         // Do remaining entries with a scalar loop

         for ( ; i < dim; ++i) {

           const ValueType ai = *aa++;

           const ValueType xi = *xx++;

           const ValueType aixi = ai*xi;

           *yy++ += c1*(a0*xi + ai*x0) + c2*aixi;

           y0  += c1*aixi;

         }

         // Same index-0 correction as the symmetric branch, with the extra
         // c2*a0*x0 that the y[i] update added to y[0] removed as well.
         // NOTE(review): 3.0 is a double literal (see the symmetric branch).
         y[0] += y0 + (c0-3.0*c1-c2)*a0*x0;


       }


     }


     // Scalar path (block_size <= 1): index 0 is handled up front and the
     // loops start at i = 1, so no correction term is needed.
     else {


       ValueType y0 = c0*a0*x0;


       if (tensor.symmetric()) {


         for ( size_type i = 1; i < dim; ++i) {

           const ValueType ai = a[i];

           const ValueType xi = x[i];

           y[i] += c1*(a0*xi + ai*x0);

           y0  += c1*ai*xi;

         }

         y[0] += y0;


       }

       else {


         const ValueType c2 = tensor.value(2);

         for ( size_type i = 1; i < dim; ++i) {

           const ValueType ai = a[i];

           const ValueType xi = x[i];

           const ValueType aixi = ai*xi;

           y[i] += c1*(a0*xi + ai*x0) + c2*aixi;

           y0  += c1*aixi;

         }

         y[0] += y0;


       }


     }


   }


   /// Number of matrix coefficients apply() reads: tensor.dimension().
   KOKKOS_INLINE_FUNCTION

   static size_type matrix_size( const tensor_type & tensor )

   { return tensor.dimension(); }


   /// Number of vector coefficients apply() reads and updates:
   /// tensor.dimension().
   KOKKOS_INLINE_FUNCTION

   static size_type vector_size( const tensor_type & tensor )

   { return tensor.dimension(); }

 };


 } /* namespace Stokhos */


 //----------------------------------------------------------------------------

 //----------------------------------------------------------------------------


 #endif /* #ifndef STOKHOS_LINEAR_SPARSE_3_TENSOR_HPP */

Stokhos_Multiply.hpp

Stokhos_Sparse3Tensor.hpp

Stokhos::LinearSparse3Tensor::entry_count
KOKKOS_INLINE_FUNCTION size_type entry_count() const
Number of sparse entries.
Definition: Stokhos_LinearSparse3Tensor.hpp:127

Stokhos::Sparse3Tensor
Data structure storing a sparse 3-tensor C(i,j,k) in a compressed format.
Definition: Stokhos_Sparse3Tensor.hpp:56

Teuchos::ParameterList::get
T & get(ParameterList &l, const std::string &name)

Stokhos::LinearSparse3Tensor::m_value
value_array_type m_value
Definition: Stokhos_LinearSparse3Tensor.hpp:75

Stokhos::TinyVec
Definition: Stokhos_TinyVec.hpp:345

Stokhos::LinearSparse3Tensor::value_type
ValueType value_type
Definition: Stokhos_LinearSparse3Tensor.hpp:67

Stokhos::LinearSparse3Tensor::create
static LinearSparse3Tensor create(const Stokhos::ProductBasis< OrdinalType, ValueType > &basis, const Stokhos::Sparse3Tensor< OrdinalType, ValueType > &Cijk, const Teuchos::ParameterList &params)
Definition: Stokhos_LinearSparse3Tensor.hpp:152

Stokhos_ProductBasis.hpp

Stokhos::LinearSparse3Tensor::num_non_zeros
KOKKOS_INLINE_FUNCTION size_type num_non_zeros() const
Number of non-zeros.
Definition: Stokhos_LinearSparse3Tensor.hpp:142

Stokhos::LinearSparse3Tensor::value_array_type
Kokkos::View< value_type[], execution_space > value_array_type
Definition: Stokhos_LinearSparse3Tensor.hpp:73

Stokhos::LinearSparse3Tensor::m_symmetric
bool m_symmetric
Definition: Stokhos_LinearSparse3Tensor.hpp:80

Stokhos::BlockMultiply< LinearSparse3Tensor< ValueType, Device, BlockSize > >::size_type
Device::size_type size_type
Definition: Stokhos_LinearSparse3Tensor.hpp:210

Stokhos::BlockMultiply< LinearSparse3Tensor< ValueType, Device, BlockSize > >::matrix_size
static KOKKOS_INLINE_FUNCTION size_type matrix_size(const tensor_type &tensor)
Definition: Stokhos_LinearSparse3Tensor.hpp:352

Stokhos::LinearSparse3Tensor::~LinearSparse3Tensor
~LinearSparse3Tensor()
Definition: Stokhos_LinearSparse3Tensor.hpp:85

Stokhos::LinearSparse3Tensor::dimension
KOKKOS_INLINE_FUNCTION size_type dimension() const
Dimension of the tensor.
Definition: Stokhos_LinearSparse3Tensor.hpp:119

Stokhos::LinearSparse3Tensor::symmetric
KOKKOS_INLINE_FUNCTION bool symmetric() const
Is tensor built from symmetric PDFs.
Definition: Stokhos_LinearSparse3Tensor.hpp:132

Stokhos::LinearSparse3Tensor::execution_space
ExecutionSpace execution_space
Definition: Stokhos_LinearSparse3Tensor.hpp:65

Teuchos_ParameterList.hpp

Stokhos::LinearSparse3Tensor
Sparse product tensor with replicated entries to provide subsets with a given coordinate.
Definition: Stokhos_LinearSparse3Tensor.hpp:62

Stokhos::LinearSparse3Tensor::size_type
execution_space::size_type size_type
Definition: Stokhos_LinearSparse3Tensor.hpp:66

Stokhos::BlockMultiply< LinearSparse3Tensor< ValueType, Device, BlockSize > >::apply
static KOKKOS_INLINE_FUNCTION void apply(const tensor_type &tensor, const MatrixValue *const a, const VectorValue *const x, VectorValue *const y)
Definition: Stokhos_LinearSparse3Tensor.hpp:215

Stokhos::BlockMultiply< LinearSparse3Tensor< ValueType, Device, BlockSize > >::tensor_type
LinearSparse3Tensor< ValueType, Device, BlockSize > tensor_type
Definition: Stokhos_LinearSparse3Tensor.hpp:211

Kokkos::deep_copy
void deep_copy(const Stokhos::CrsMatrix< ValueType, DstDevice, Layout > &dst, const Stokhos::CrsMatrix< ValueType, SrcDevice, Layout > &src)
Definition: Stokhos_CrsMatrix.hpp:688

Stokhos::ProductBasis< OrdinalType, ValueType >

Teuchos::ParameterList

Stokhos::LinearSparse3Tensor::operator=
LinearSparse3Tensor & operator=(const LinearSparse3Tensor &rhs)
Definition: Stokhos_LinearSparse3Tensor.hpp:106

Stokhos::LinearSparse3Tensor::LinearSparse3Tensor
LinearSparse3Tensor()
Definition: Stokhos_LinearSparse3Tensor.hpp:88

Stokhos::ProductBasis::getCoordinateBases
virtual Teuchos::Array< Teuchos::RCP< const OneDOrthogPolyBasis< ordinal_type, value_type > > > getCoordinateBases() const =0
Return array of coordinate bases.

Kokkos::cijk
KOKKOS_INLINE_FUNCTION constexpr std::enable_if< is_view_uq_pce< view_type >::value, typename CijkType< view_type >::type >::type cijk(const view_type &view)
Definition: KokkosExp_View_UQ_PCE_Contiguous.hpp:217

Stokhos::LinearSparse3Tensor::m_nnz
size_type m_nnz
Definition: Stokhos_LinearSparse3Tensor.hpp:78

Stokhos::LinearSparse3Tensor::aligned_dimension
KOKKOS_INLINE_FUNCTION size_type aligned_dimension() const
Dimension of the tensor, rounded up to a multiple of the block size.
Definition: Stokhos_LinearSparse3Tensor.hpp:123

Stokhos::LinearSparse3Tensor::LinearSparse3Tensor
LinearSparse3Tensor(const LinearSparse3Tensor &rhs)
Definition: Stokhos_LinearSparse3Tensor.hpp:97

Stokhos::LinearSparse3Tensor::value
KOKKOS_INLINE_FUNCTION const value_type & value(const size_type entry) const
Value for entry 'entry'.
Definition: Stokhos_LinearSparse3Tensor.hpp:137

Stokhos::LinearSparse3Tensor::block_size
static const int block_size
Definition: Stokhos_LinearSparse3Tensor.hpp:69

Stokhos_TinyVec.hpp

Stokhos::LinearSparse3Tensor::num_flops
KOKKOS_INLINE_FUNCTION size_type num_flops() const
Number of flops per multiply-add.
Definition: Stokhos_LinearSparse3Tensor.hpp:147

Stokhos::LinearSparse3Tensor::m_aligned_dim
size_type m_aligned_dim
Definition: Stokhos_LinearSparse3Tensor.hpp:77

Stokhos::LinearSparse3Tensor::m_dim
size_type m_dim
Definition: Stokhos_LinearSparse3Tensor.hpp:76

Stokhos::BlockMultiply
Definition: Stokhos_Multiply.hpp:151

Teuchos::RCP

Stokhos::LinearSparse3Tensor::m_flops
size_type m_flops
Definition: Stokhos_LinearSparse3Tensor.hpp:79

Stokhos::BlockMultiply< LinearSparse3Tensor< ValueType, Device, BlockSize > >::vector_size
static KOKKOS_INLINE_FUNCTION size_type vector_size(const tensor_type &tensor)
Definition: Stokhos_LinearSparse3Tensor.hpp:356

Stokhos::create_linear_sparse_3_tensor
LinearSparse3Tensor< ValueType, Device, BlockSize > create_linear_sparse_3_tensor(const Stokhos::ProductBasis< OrdinalType, ValueType > &basis, const Stokhos::Sparse3Tensor< OrdinalType, ValueType > &Cijk, const Teuchos::ParameterList &params)
Definition: Stokhos_LinearSparse3Tensor.hpp:196

Stokhos::OrthogPolyBasis::size
virtual ordinal_type size() const =0
Return total size of basis.

Kokkos::create_mirror_view
Stokhos::CrsMatrix< ValueType, Device, Layout >::HostMirror create_mirror_view(const Stokhos::CrsMatrix< ValueType, Device, Layout > &A)
Definition: Stokhos_CrsMatrix.hpp:677

Teuchos::Array