Stokhos Package Browser (Single Doxygen Collection)  Version of the Day
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Groups Pages
Stokhos_KokkosCrsMatrixMPVectorUnitTest_Threads.cpp
Go to the documentation of this file.
1 // @HEADER
2 // ***********************************************************************
3 //
4 // Stokhos Package
5 // Copyright (2009) Sandia Corporation
6 //
7 // Under terms of Contract DE-AC04-94AL85000, there is a non-exclusive
8 // license for use of this work by or on behalf of the U.S. Government.
9 //
10 // Redistribution and use in source and binary forms, with or without
11 // modification, are permitted provided that the following conditions are
12 // met:
13 //
14 // 1. Redistributions of source code must retain the above copyright
15 // notice, this list of conditions and the following disclaimer.
16 //
17 // 2. Redistributions in binary form must reproduce the above copyright
18 // notice, this list of conditions and the following disclaimer in the
19 // documentation and/or other materials provided with the distribution.
20 //
21 // 3. Neither the name of the Corporation nor the names of the
22 // contributors may be used to endorse or promote products derived from
23 // this software without specific prior written permission.
24 //
25 // THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
26 // EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
27 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
28 // PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
29 // CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
30 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
31 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
32 // PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
33 // LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
34 // NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
35 // SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
36 //
37 // Questions? Contact Eric T. Phipps (etphipp@sandia.gov).
38 //
39 // ***********************************************************************
40 // @HEADER
41 
45 
47 
48 #include "Kokkos_Core.hpp"
49 
50 // Instantiate test for Threads device
51 using Kokkos::Threads;
53 
54 template <typename Storage, typename Ordinal, typename MultiplyOp,
55  Ordinal NumPerThread, Ordinal ThreadsPerVector>
57  Ordinal num_cores,
58  Teuchos::FancyOStream& out) {
59  const Ordinal VectorSize = NumPerThread * ThreadsPerVector;
60  typedef typename Storage::template apply_N<VectorSize>::type storage_type;
61  typedef Sacado::MP::Vector<storage_type> Vector;
62 
63  const Ordinal nGrid = 5;
64 
65  bool success = true;
66  if (num_hyper_threads >= ThreadsPerVector) {
67  int row_threads = num_hyper_threads / ThreadsPerVector;
68  KokkosSparse::DeviceConfig dev_config(num_cores, ThreadsPerVector, row_threads);
69 
70  success = test_embedded_vector<Vector>(
71  nGrid, VectorSize, dev_config, MultiplyOp(), out);
72  }
73  return success;
74 }
75 
77 
79  Kokkos_CrsMatrix_MP, Multiply_1, Storage, MultiplyOp )
80 {
81  typedef typename Storage::ordinal_type Ordinal;
82  const Ordinal NumPerThread = 16;
83  const Ordinal ThreadsPerVector = 1;
84  success =
85  test_host_embedded_vector<Storage,Ordinal,MultiplyOp,NumPerThread,ThreadsPerVector>(num_hyper_threads, num_cores, out);
86 }
87 
89  Kokkos_CrsMatrix_MP, Multiply_2, Storage, MultiplyOp )
90 {
91  typedef typename Storage::ordinal_type Ordinal;
92  const Ordinal NumPerThread = 8;
93  const Ordinal ThreadsPerVector = 2;
94  success =
95  test_host_embedded_vector<Storage,Ordinal,MultiplyOp,NumPerThread,ThreadsPerVector>(num_hyper_threads, num_cores, out);
96 }
97 
98 #define CRS_MATRIX_MP_VECTOR_MULTIPLY_TESTS_STORAGE_OP( STORAGE, OP ) \
99  TEUCHOS_UNIT_TEST_TEMPLATE_2_INSTANT( \
100  Kokkos_CrsMatrix_MP, Multiply_1, STORAGE, OP ) \
101  TEUCHOS_UNIT_TEST_TEMPLATE_2_INSTANT( \
102  Kokkos_CrsMatrix_MP, Multiply_2, STORAGE, OP )
103 
104 // Notes: SFS, DS are defined in main test header (we are also being lazy
105 // and not putting ordinal/scalar/device in the names, assuming we will only
106 // do one combination). We can't do DefaultMultiply for DS because it
107 // uses partitioning
108 #define CRS_MATRIX_MP_VECTOR_MULTIPLY_TESTS_ORDINAL_SCALAR_DEVICE( ORDINAL, SCALAR, DEVICE ) \
109  CRS_MATRIX_MP_VECTOR_MULTIPLY_TESTS_STORAGE_OP( SFS, DefaultMultiply ) \
110  CRS_MATRIX_MP_VECTOR_MULTIPLY_TESTS_STORAGE_OP( SFS, KokkosMultiply ) \
111  CRS_MATRIX_MP_VECTOR_MULTIPLY_TESTS_STORAGE_OP( DS, DefaultMultiply ) \
112  CRS_MATRIX_MP_VECTOR_MULTIPLY_TESTS_STORAGE_OP( DS, KokkosMultiply )
113 
115 
116 int main( int argc, char* argv[] ) {
117  Teuchos::GlobalMPISession mpiSession(&argc, &argv);
118 
119  // Initialize threads
120  num_cores =
121  Kokkos::hwloc::get_available_numa_count() *
122  Kokkos::hwloc::get_available_cores_per_numa();
124  Kokkos::hwloc::get_available_threads_per_core();
125 
126  Kokkos::InitArguments init_args;
127  init_args.num_threads = num_cores*num_hyper_threads;
128  Kokkos::initialize( init_args );
129  Kokkos::print_configuration(std::cout);
130 
131  // Run tests
133 
134  // Finish up
135  Kokkos::finalize();
136 
137  return ret;
138 }
Stokhos::StandardStorage< int, double > storage_type
bool test_host_embedded_vector(Ordinal num_hyper_threads, Ordinal num_cores, Teuchos::FancyOStream &out)
#define CRSMATRIX_MP_VECTOR_TESTS_DEVICE(DEVICE)
static int runUnitTestsFromMain(int argc, char *argv[])
TEUCHOS_UNIT_TEST_TEMPLATE_2_DECL(Kokkos_SG_SpMv, CrsProductTensorCijk, Scalar, Device)
#define CRS_MATRIX_MP_VECTOR_MULTIPLY_TESTS_ORDINAL_SCALAR_DEVICE(ORDINAL, SCALAR, DEVICE)
int main(int argc, char **argv)
basic_FancyOStream< char > FancyOStream