Tpetra parallel linear algebra  Version of the Day
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Pages
Tpetra_Details_DeepCopyTeuchosTimerInjection.cpp
1 /*
2 // @HEADER
3 // ***********************************************************************
4 //
5 // Tpetra: Templated Linear Algebra Services Package
6 // Copyright (2008) Sandia Corporation
7 //
8 // Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation,
9 // the U.S. Government retains certain rights in this software.
10 //
11 // Redistribution and use in source and binary forms, with or without
12 // modification, are permitted provided that the following conditions are
13 // met:
14 //
15 // 1. Redistributions of source code must retain the above copyright
16 // notice, this list of conditions and the following disclaimer.
17 //
18 // 2. Redistributions in binary form must reproduce the above copyright
19 // notice, this list of conditions and the following disclaimer in the
20 // documentation and/or other materials provided with the distribution.
21 //
22 // 3. Neither the name of the Corporation nor the names of the
23 // contributors may be used to endorse or promote products derived from
24 // this software without specific prior written permission.
25 //
26 // THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
27 // EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
28 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
29 // PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
30 // CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
31 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
32 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
33 // PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
34 // LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
35 // NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
36 // SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
37 //
38 // ************************************************************************
39 // @HEADER
40 */
#include "Tpetra_Details_DeepCopyTeuchosTimerInjection.hpp"
#include "TpetraCore_config.h"
#include "Tpetra_Details_Behavior.hpp"
#include "Kokkos_Core.hpp"
#include "Teuchos_TimeMonitor.hpp"
#include "Teuchos_Time.hpp"
#include "Teuchos_RCP.hpp"
#ifdef HAVE_TEUCHOS_ADD_TIME_MONITOR_TO_STACKED_TIMER
#include "Teuchos_StackedTimer.hpp"
#include <sstream>
#include <stdexcept>
#endif
#include <cstdint>
#include <cstring>
#include <iostream>
#include <string>
53 
55 
56 
57 
58 namespace Tpetra {
59 namespace Details {
60 
61  namespace DeepCopyTimerInjection {
62  Teuchos::RCP<Teuchos::Time> timer_;
63  bool initialized_ = false;
64 
65  void kokkosp_begin_deep_copy(Kokkos::Tools::SpaceHandle dst_handle, const char* dst_name, const void* dst_ptr,
66  Kokkos::Tools::SpaceHandle src_handle, const char* src_name, const void* src_ptr,
67  uint64_t size) {
68  // In verbose mode, we add the src/dst names as well
69  std::string extra_label;
71  extra_label = std::string(" {") + src_name + "=>" + dst_name + "," + std::to_string(size)+"}";
72  }
73 
74  if(timer_ != Teuchos::null)
75  std::cout << "WARNING: Kokkos::deep_copy() started within another Kokkos::deep_copy(). Timers will be in error"<<std::endl;
76 
77  // If the src_name is "Scalar" then we're doing a "Fill" style copy from host to devices, which we want to record separately.
78  if(!strcmp(src_name,"Scalar"))
79  timer_ = Teuchos::TimeMonitor::getNewTimer(std::string("Kokkos::deep_copy_scalar [")+src_handle.name+"=>"+dst_handle.name+"]" + extra_label);
80  // If the size is under 65 bytes, we're going to flag this as "small" to make it easier to watch the big stuff
81  else if(size <= 64)
82  timer_ = Teuchos::TimeMonitor::getNewTimer(std::string("Kokkos::deep_copy_small [")+src_handle.name+"=>"+dst_handle.name+"]" + extra_label);
83  else
84  timer_ = Teuchos::TimeMonitor::getNewTimer(std::string("Kokkos::deep_copy [")+src_handle.name+"=>"+dst_handle.name+"]" + extra_label);
85  timer_->start();
86  timer_->incrementNumCalls();
87 #ifdef HAVE_TEUCHOS_ADD_TIME_MONITOR_TO_STACKED_TIMER
88  const auto stackedTimer = Teuchos::TimeMonitor::getStackedTimer();
89  if (nonnull(stackedTimer))
90  stackedTimer->start(timer_->name());
91 #endif
92  }
93 
94  void kokkosp_end_deep_copy() {
95  if (timer_ != Teuchos::null) {
96  timer_->stop();
97 #ifdef HAVE_TEUCHOS_ADD_TIME_MONITOR_TO_STACKED_TIMER
98  try {
99  const auto stackedTimer = Teuchos::TimeMonitor::getStackedTimer();
100  if (nonnull(stackedTimer))
101  stackedTimer->stop(timer_->name());
102  }
103  catch (std::runtime_error&) {
104  std::ostringstream warning;
105  warning <<
106  "\n*********************************************************************\n"
107  "WARNING: Overlapping timers detected!\n"
108  "A TimeMonitor timer was stopped before a nested subtimer was\n"
109  "stopped. This is not allowed by the StackedTimer. This corner case\n"
110  "typically occurs if the TimeMonitor is stored in an RCP and the RCP is\n"
111  "assigned to a new timer. To disable this warning, either fix the\n"
112  "ordering of timer creation and destuction or disable the StackedTimer\n";
113  std::cout << warning.str() << std::endl;
114  Teuchos::TimeMonitor::setStackedTimer(Teuchos::null);
115  }
116 #endif
117  }
118 
119  timer_ = Teuchos::null;
120  }
121  }// end DeepCopyTimerInjection
122 
123 
124 
125  void AddKokkosDeepCopyToTimeMonitor(bool force) {
126  if (!DeepCopyTimerInjection::initialized_) {
128  Kokkos::Tools::Experimental::set_begin_deep_copy_callback(DeepCopyTimerInjection::kokkosp_begin_deep_copy);
129  Kokkos::Tools::Experimental::set_end_deep_copy_callback(DeepCopyTimerInjection::kokkosp_end_deep_copy);
130  DeepCopyTimerInjection::initialized_=true;
131 
132  }
133  }
134  }
135 
136 
137 } // namespace Details
138 } // namespace Tpetra
139 
Declaration of Tpetra::Details::DeepCopyTeuchosTimerInjection, a class that uses Kokkos' profiling li...
static bool timeKokkosDeepCopy()
Add Teuchos timers for all host calls to Kokkos::deep_copy(). This is especially useful for identifyi...
static bool timeKokkosDeepCopyVerbose()
Adds verbose output to Kokkos deep_copy timers. This is especially useful for identifying host/device ...
Declaration of Tpetra::Details::Behavior, a class that describes Tpetra's behavior.