16 #ifndef __INTREPID2_HGRAD_HEX_C1_FEM_DEF_HPP__
17 #define __INTREPID2_HGRAD_HEX_C1_FEM_DEF_HPP__
24 template<EOperator opType>
25 template<
typename OutputViewType,
26 typename inputViewType>
27 KOKKOS_INLINE_FUNCTION
29 Basis_HGRAD_HEX_C1_FEM::Serial<opType>::
30 getValues( OutputViewType output,
31 const inputViewType input ) {
33 case OPERATOR_VALUE : {
34 const auto x = input(0);
35 const auto y = input(1);
36 const auto z = input(2);
39 output.access(0) = (1.0 - x)*(1.0 - y)*(1.0 - z)/8.0;
40 output.access(1) = (1.0 + x)*(1.0 - y)*(1.0 - z)/8.0;
41 output.access(2) = (1.0 + x)*(1.0 + y)*(1.0 - z)/8.0;
42 output.access(3) = (1.0 - x)*(1.0 + y)*(1.0 - z)/8.0;
44 output.access(4) = (1.0 - x)*(1.0 - y)*(1.0 + z)/8.0;
45 output.access(5) = (1.0 + x)*(1.0 - y)*(1.0 + z)/8.0;
46 output.access(6) = (1.0 + x)*(1.0 + y)*(1.0 + z)/8.0;
47 output.access(7) = (1.0 - x)*(1.0 + y)*(1.0 + z)/8.0;
50 case OPERATOR_GRAD : {
51 const auto x = input(0);
52 const auto y = input(1);
53 const auto z = input(2);
56 output.access(0, 0) = -(1.0 - y)*(1.0 - z)/8.0;
57 output.access(0, 1) = -(1.0 - x)*(1.0 - z)/8.0;
58 output.access(0, 2) = -(1.0 - x)*(1.0 - y)/8.0;
60 output.access(1, 0) = (1.0 - y)*(1.0 - z)/8.0;
61 output.access(1, 1) = -(1.0 + x)*(1.0 - z)/8.0;
62 output.access(1, 2) = -(1.0 + x)*(1.0 - y)/8.0;
64 output.access(2, 0) = (1.0 + y)*(1.0 - z)/8.0;
65 output.access(2, 1) = (1.0 + x)*(1.0 - z)/8.0;
66 output.access(2, 2) = -(1.0 + x)*(1.0 + y)/8.0;
68 output.access(3, 0) = -(1.0 + y)*(1.0 - z)/8.0;
69 output.access(3, 1) = (1.0 - x)*(1.0 - z)/8.0;
70 output.access(3, 2) = -(1.0 - x)*(1.0 + y)/8.0;
72 output.access(4, 0) = -(1.0 - y)*(1.0 + z)/8.0;
73 output.access(4, 1) = -(1.0 - x)*(1.0 + z)/8.0;
74 output.access(4, 2) = (1.0 - x)*(1.0 - y)/8.0;
76 output.access(5, 0) = (1.0 - y)*(1.0 + z)/8.0;
77 output.access(5, 1) = -(1.0 + x)*(1.0 + z)/8.0;
78 output.access(5, 2) = (1.0 + x)*(1.0 - y)/8.0;
80 output.access(6, 0) = (1.0 + y)*(1.0 + z)/8.0;
81 output.access(6, 1) = (1.0 + x)*(1.0 + z)/8.0;
82 output.access(6, 2) = (1.0 + x)*(1.0 + y)/8.0;
84 output.access(7, 0) = -(1.0 + y)*(1.0 + z)/8.0;
85 output.access(7, 1) = (1.0 - x)*(1.0 + z)/8.0;
86 output.access(7, 2) = (1.0 - x)*(1.0 + y)/8.0;
90 const auto x = input(0);
91 const auto y = input(1);
92 const auto z = input(2);
95 output.access(0, 0) = 0.0;
96 output.access(0, 1) = (1.0 - z)/8.0;
97 output.access(0, 2) = (1.0 - y)/8.0;
98 output.access(0, 3) = 0.0;
99 output.access(0, 4) = (1.0 - x)/8.0;
100 output.access(0, 5) = 0.0;
102 output.access(1, 0) = 0.0;
103 output.access(1, 1) = -(1.0 - z)/8.0;
104 output.access(1, 2) = -(1.0 - y)/8.0;
105 output.access(1, 3) = 0.0;
106 output.access(1, 4) = (1.0 + x)/8.0;
107 output.access(1, 5) = 0.0;
109 output.access(2, 0) = 0.0;
110 output.access(2, 1) = (1.0 - z)/8.0;
111 output.access(2, 2) = -(1.0 + y)/8.0;
112 output.access(2, 3) = 0.0;
113 output.access(2, 4) = -(1.0 + x)/8.0;
114 output.access(2, 5) = 0.0;
116 output.access(3, 0) = 0.0;
117 output.access(3, 1) = -(1.0 - z)/8.0;
118 output.access(3, 2) = (1.0 + y)/8.0;
119 output.access(3, 3) = 0.0;
120 output.access(3, 4) = -(1.0 - x)/8.0;
121 output.access(3, 5) = 0.0;
124 output.access(4, 0) = 0.0;
125 output.access(4, 1) = (1.0 + z)/8.0;
126 output.access(4, 2) = -(1.0 - y)/8.0;
127 output.access(4, 3) = 0.0;
128 output.access(4, 4) = -(1.0 - x)/8.0;
129 output.access(4, 5) = 0.0;
131 output.access(5, 0) = 0.0;
132 output.access(5, 1) = -(1.0 + z)/8.0;
133 output.access(5, 2) = (1.0 - y)/8.0;
134 output.access(5, 3) = 0.0;
135 output.access(5, 4) = -(1.0 + x)/8.0;
136 output.access(5, 5) = 0.0;
138 output.access(6, 0) = 0.0;
139 output.access(6, 1) = (1.0 + z)/8.0;
140 output.access(6, 2) = (1.0 + y)/8.0;
141 output.access(6, 3) = 0.0;
142 output.access(6, 4) = (1.0 + x)/8.0;
143 output.access(6, 5) = 0.0;
145 output.access(7, 0) = 0.0;
146 output.access(7, 1) = -(1.0 + z)/8.0;
147 output.access(7, 2) = -(1.0 + y)/8.0;
148 output.access(7, 3) = 0.0;
149 output.access(7, 4) = (1.0 - x)/8.0;
150 output.access(7, 5) = 0.0;
157 output.access(0, 0) = 0.0;
158 output.access(0, 1) = 0.0;
159 output.access(0, 2) = 0.0;
160 output.access(0, 3) = 0.0;
161 output.access(0, 4) = -1.0/8.0;
162 output.access(0, 5) = 0.0;
163 output.access(0, 6) = 0.0;
164 output.access(0, 7) = 0.0;
165 output.access(0, 8) = 0.0;
166 output.access(0, 9) = 0.0;
169 output.access(1, 0) = 0.0;
170 output.access(1, 1) = 0.0;
171 output.access(1, 2) = 0.0;
172 output.access(1, 3) = 0.0;
173 output.access(1, 4) = 1.0/8.0;
174 output.access(1, 5) = 0.0;
175 output.access(1, 6) = 0.0;
176 output.access(1, 7) = 0.0;
177 output.access(1, 8) = 0.0;
178 output.access(1, 9) = 0.0;
181 output.access(2, 0) = 0.0;
182 output.access(2, 1) = 0.0;
183 output.access(2, 2) = 0.0;
184 output.access(2, 3) = 0.0;
185 output.access(2, 4) = -1.0/8.0;
186 output.access(2, 5) = 0.0;
187 output.access(2, 6) = 0.0;
188 output.access(2, 7) = 0.0;
189 output.access(2, 8) = 0.0;
190 output.access(2, 9) = 0.0;
193 output.access(3, 0) = 0.0;
194 output.access(3, 1) = 0.0;
195 output.access(3, 2) = 0.0;
196 output.access(3, 3) = 0.0;
197 output.access(3, 4) = 1.0/8.0;
198 output.access(3, 5) = 0.0;
199 output.access(3, 6) = 0.0;
200 output.access(3, 7) = 0.0;
201 output.access(3, 8) = 0.0;
202 output.access(3, 9) = 0.0;
205 output.access(4, 0) = 0.0;
206 output.access(4, 1) = 0.0;
207 output.access(4, 2) = 0.0;
208 output.access(4, 3) = 0.0;
209 output.access(4, 4) = 1.0/8.0;
210 output.access(4, 5) = 0.0;
211 output.access(4, 6) = 0.0;
212 output.access(4, 7) = 0.0;
213 output.access(4, 8) = 0.0;
214 output.access(4, 9) = 0.0;
217 output.access(5, 0) = 0.0;
218 output.access(5, 1) = 0.0;
219 output.access(5, 2) = 0.0;
220 output.access(5, 3) = 0.0;
221 output.access(5, 4) = -1.0/8.0;
222 output.access(5, 5) = 0.0;
223 output.access(5, 6) = 0.0;
224 output.access(5, 7) = 0.0;
225 output.access(5, 8) = 0.0;
226 output.access(5, 9) = 0.0;
229 output.access(6, 0) = 0.0;
230 output.access(6, 1) = 0.0;
231 output.access(6, 2) = 0.0;
232 output.access(6, 3) = 0.0;
233 output.access(6, 4) = 1.0/8.0;
234 output.access(6, 5) = 0.0;
235 output.access(6, 6) = 0.0;
236 output.access(6, 7) = 0.0;
237 output.access(6, 8) = 0.0;
238 output.access(6, 9) = 0.0;
241 output.access(7, 0) = 0.0;
242 output.access(7, 1) = 0.0;
243 output.access(7, 2) = 0.0;
244 output.access(7, 3) = 0.0;
245 output.access(7, 4) = -1.0/8.0;
246 output.access(7, 5) = 0.0;
247 output.access(7, 6) = 0.0;
248 output.access(7, 7) = 0.0;
249 output.access(7, 8) = 0.0;
250 output.access(7, 9) = 0.0;
254 case OPERATOR_MAX : {
255 const ordinal_type jend = output.extent(1);
256 const ordinal_type iend = output.extent(0);
258 for (ordinal_type j=0;j<jend;++j)
259 for (ordinal_type i=0;i<iend;++i)
260 output.access(i, j) = 0.0;
264 INTREPID2_TEST_FOR_ABORT( opType != OPERATOR_VALUE &&
265 opType != OPERATOR_GRAD &&
266 opType != OPERATOR_CURL &&
267 opType != OPERATOR_D2 &&
268 opType != OPERATOR_MAX,
269 ">>> ERROR: (Intrepid2::Basis_HGRAD_HEX_C1_FEM::Serial::getValues) operator is not supported");
275 template<
typename DT,
276 typename outputValueValueType,
class ...outputValueProperties,
277 typename inputPointValueType,
class ...inputPointProperties>
279 Basis_HGRAD_HEX_C1_FEM::
280 getValues(
const typename DT::execution_space& space,
281 Kokkos::DynRankView<outputValueValueType,outputValueProperties...> outputValues,
282 const Kokkos::DynRankView<inputPointValueType, inputPointProperties...> inputPoints,
283 const EOperator operatorType ) {
284 typedef Kokkos::DynRankView<outputValueValueType,outputValueProperties...> outputValueViewType;
285 typedef Kokkos::DynRankView<inputPointValueType, inputPointProperties...> inputPointViewType;
286 typedef typename ExecSpace<typename inputPointViewType::execution_space,typename DT::execution_space>::ExecSpaceType ExecSpaceType;
289 const auto loopSize = inputPoints.extent(0);
290 Kokkos::RangePolicy<ExecSpaceType,Kokkos::Schedule<Kokkos::Static> > policy(space, 0, loopSize);
292 switch (operatorType) {
294 case OPERATOR_VALUE: {
295 typedef Functor<outputValueViewType,inputPointViewType,OPERATOR_VALUE> FunctorType;
296 Kokkos::parallel_for( policy, FunctorType(outputValues, inputPoints) );
301 typedef Functor<outputValueViewType,inputPointViewType,OPERATOR_GRAD> FunctorType;
302 Kokkos::parallel_for( policy, FunctorType(outputValues, inputPoints) );
305 case OPERATOR_CURL: {
306 INTREPID2_TEST_FOR_EXCEPTION( operatorType == OPERATOR_CURL, std::invalid_argument,
307 ">>> ERROR (Basis_HGRAD_HEX_C1_FEM): CURL is invalid operator for rank-0 (scalar) functions in 3D");
312 INTREPID2_TEST_FOR_EXCEPTION( (operatorType == OPERATOR_DIV), std::invalid_argument,
313 ">>> ERROR (Basis_HGRAD_HEX_C1_FEM): DIV is invalid operator for rank-0 (scalar) functions in 3D");
318 typedef Functor<outputValueViewType,inputPointViewType,OPERATOR_D2> FunctorType;
319 Kokkos::parallel_for( policy, FunctorType(outputValues, inputPoints) );
323 typedef Functor<outputValueViewType,inputPointViewType,OPERATOR_D3> FunctorType;
324 Kokkos::parallel_for( policy, FunctorType(outputValues, inputPoints) );
334 typedef Functor<outputValueViewType,inputPointViewType,OPERATOR_MAX> FunctorType;
335 Kokkos::parallel_for( policy, FunctorType(outputValues, inputPoints) );
339 INTREPID2_TEST_FOR_EXCEPTION( !( Intrepid2::isValidOperator(operatorType) ), std::invalid_argument,
340 ">>> ERROR (Basis_HGRAD_HEX_C1_FEM): Invalid operator type");
348 template<
typename DT,
typename OT,
typename PT>
351 constexpr ordinal_type spaceDim = 3;
352 this->basisCardinality_ = 8;
353 this->basisDegree_ = 1;
354 this->basisCellTopologyKey_ = shards::Hexahedron<8>::key;
355 this->basisType_ = BASIS_FEM_DEFAULT;
356 this->basisCoordinates_ = COORDINATES_CARTESIAN;
357 this->functionSpace_ = FUNCTION_SPACE_HGRAD;
362 const ordinal_type tagSize = 4;
363 const ordinal_type posScDim = 0;
364 const ordinal_type posScOrd = 1;
365 const ordinal_type posDfOrd = 2;
368 ordinal_type tags[32] = { 0, 0, 0, 1,
383 this->setOrdinalTagData(this->tagToOrdinal_,
386 this->basisCardinality_,
400 Kokkos::DynRankView<typename ScalarViewType::value_type,typename DT::execution_space::array_layout,Kokkos::HostSpace>
401 dofCoords(
"dofCoordsHost", this->basisCardinality_,spaceDim);
403 dofCoords(0,0) = -1.0; dofCoords(0,1) = -1.0; dofCoords(0,2) = -1.0;
404 dofCoords(1,0) = 1.0; dofCoords(1,1) = -1.0; dofCoords(1,2) = -1.0;
405 dofCoords(2,0) = 1.0; dofCoords(2,1) = 1.0; dofCoords(2,2) = -1.0;
406 dofCoords(3,0) = -1.0; dofCoords(3,1) = 1.0; dofCoords(3,2) = -1.0;
407 dofCoords(4,0) = -1.0; dofCoords(4,1) = -1.0; dofCoords(4,2) = 1.0;
408 dofCoords(5,0) = 1.0; dofCoords(5,1) = -1.0; dofCoords(5,2) = 1.0;
409 dofCoords(6,0) = 1.0; dofCoords(6,1) = 1.0; dofCoords(6,2) = 1.0;
410 dofCoords(7,0) = -1.0; dofCoords(7,1) = 1.0; dofCoords(7,2) = 1.0;
412 this->dofCoords_ = Kokkos::create_mirror_view(
typename DT::memory_space(), dofCoords);
413 Kokkos::deep_copy(this->dofCoords_, dofCoords);
416 template<
typename DT,
typename OT,
typename PT>
419 ordinal_type& perTeamSpaceSize,
420 ordinal_type& perThreadSpaceSize,
422 const EOperator operatorType)
const {
423 perTeamSpaceSize = 0;
424 perThreadSpaceSize = 0;
427 template<
typename DT,
typename OT,
typename PT>
428 KOKKOS_INLINE_FUNCTION
431 OutputViewType outputValues,
432 const PointViewType inputPoints,
433 const EOperator operatorType,
434 const typename Kokkos::TeamPolicy<typename DT::execution_space>::member_type& team_member,
435 const typename DT::execution_space::scratch_memory_space & scratchStorage,
436 const ordinal_type subcellDim,
437 const ordinal_type subcellOrdinal)
const {
439 INTREPID2_TEST_FOR_ABORT( !((subcellDim <= 0) && (subcellOrdinal == -1)),
440 ">>> ERROR: (Intrepid2::Basis_HGRAD_HEX_C1_FEM::getValues), The capability of selecting subsets of basis functions has not been implemented yet.");
442 (void) scratchStorage;
444 const int numPoints = inputPoints.extent(0);
446 switch(operatorType) {
448 Kokkos::parallel_for (Kokkos::TeamThreadRange (team_member, numPoints), [=] (ordinal_type& pt) {
449 auto output = Kokkos::subview( outputValues, Kokkos::ALL(), pt, Kokkos::ALL() );
450 const auto input = Kokkos::subview( inputPoints, pt, Kokkos::ALL() );
455 Kokkos::parallel_for (Kokkos::TeamThreadRange (team_member, numPoints), [=] (ordinal_type& pt) {
456 auto output = Kokkos::subview( outputValues, Kokkos::ALL(), pt, Kokkos::ALL() );
457 const auto input = Kokkos::subview( inputPoints, pt, Kokkos::ALL() );
458 Impl::Basis_HGRAD_HEX_C1_FEM::Serial<OPERATOR_GRAD>::getValues( output, input);
Kokkos::View< ordinal_type *, typename ExecutionSpace::array_layout, Kokkos::HostSpace > OrdinalTypeArray1DHost
View type for 1d host array.
Basis_HGRAD_HEX_C1_FEM()
Constructor.
See Intrepid2::Basis_HGRAD_HEX_C1_FEM.
Kokkos::DynRankView< PointValueType, Kokkos::LayoutStride, DeviceType > PointViewType
View type for input points.
virtual void getScratchSpaceSize(ordinal_type &perTeamSpaceSize, ordinal_type &perThreadSpaceSize, const PointViewType inputPointsconst, const EOperator operatorType=OPERATOR_VALUE) const override
Return the size of the scratch space, in bytes, needed for using the team-level implementation of get...
virtual void getValues(const ExecutionSpace &space, OutputViewType outputValues, const PointViewType inputPoints, const EOperator operatorType=OPERATOR_VALUE) const override
Evaluation of a FEM basis on a reference cell.