Compadre  1.5.9
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Pages
GMLS Tutorial

based on GMLS_Device.cpp

GMLS Example with Device Views

This tutorial sets up a batch of GMLS problems, solves the minimization problems, and applies the coefficients produced to data.

Parse Command Line Arguments

// called from command line
int main (int argc, char* args[]) {
// initializes MPI (if available) with command line arguments given
#ifdef COMPADRE_USE_MPI
MPI_Init(&argc, &args);
#endif
// initializes Kokkos with command line arguments given
Kokkos::initialize(argc, args);
// becomes false if the computed solution not within the failure_threshold of the actual solution
bool all_passed = true;
// code block to reduce scope for all Kokkos View allocations
// otherwise, Views may be deallocating when we call Kokkos finalize() later
{
CommandLineProcessor clp(argc, args);
auto order = clp.order;
auto dimension = clp.dimension;
auto number_target_coords = clp.number_target_coords;
auto constraint_name = clp.constraint_name;
auto solver_name = clp.solver_name;
auto problem_name = clp.problem_name;
auto number_of_batches = clp.number_of_batches;
bool keep_coefficients = number_of_batches==1;
// the functions we will be seeking to reconstruct are in the span of the basis
// of the reconstruction space we choose for GMLS, so the error should be very small
const double failure_tolerance = 1e-9;
// Laplacian is a second order differential operator, which we expect to be slightly less accurate
const double laplacian_failure_tolerance = 1e-9;
// minimum neighbors for unisolvency is the same as the size of the polynomial basis
const int min_neighbors = Compadre::GMLS::getNP(order, dimension);

Setting Up The Point Cloud

// approximate spacing of source sites
double h_spacing = 0.05;
int n_neg1_to_1 = 2*(1/h_spacing) + 1; // always odd
// number of source coordinate sites that will fill a box of [-1,1]x[-1,1]x[-1,1] with a spacing approximately h
const int number_source_coords = std::pow(n_neg1_to_1, dimension);
// coordinates of source sites
Kokkos::View<double**, Kokkos::DefaultExecutionSpace> source_coords_device("source coordinates",
number_source_coords, 3);
Kokkos::View<double**>::HostMirror source_coords = Kokkos::create_mirror_view(source_coords_device);
// coordinates of target sites
Kokkos::View<double**, Kokkos::DefaultExecutionSpace> target_coords_device ("target coordinates", number_target_coords, 3);
Kokkos::View<double**>::HostMirror target_coords = Kokkos::create_mirror_view(target_coords_device);
// fill source coordinates with a uniform grid
int source_index = 0;
double this_coord[3] = {0,0,0};
for (int i=-n_neg1_to_1/2; i<n_neg1_to_1/2+1; ++i) {
this_coord[0] = i*h_spacing;
for (int j=-n_neg1_to_1/2; j<n_neg1_to_1/2+1; ++j) {
this_coord[1] = j*h_spacing;
for (int k=-n_neg1_to_1/2; k<n_neg1_to_1/2+1; ++k) {
this_coord[2] = k*h_spacing;
if (dimension==3) {
source_coords(source_index,0) = this_coord[0];
source_coords(source_index,1) = this_coord[1];
source_coords(source_index,2) = this_coord[2];
source_index++;
}
}
if (dimension==2) {
source_coords(source_index,0) = this_coord[0];
source_coords(source_index,1) = this_coord[1];
source_coords(source_index,2) = 0;
source_index++;
}
}
if (dimension==1) {
source_coords(source_index,0) = this_coord[0];
source_coords(source_index,1) = 0;
source_coords(source_index,2) = 0;
source_index++;
}
}
// fill target coords somewhere inside of [-0.5,0.5]x[-0.5,0.5]x[-0.5,0.5]
for(int i=0; i<number_target_coords; i++){
// first, we get a uniformly random distributed direction
double rand_dir[3] = {0,0,0};
for (int j=0; j<dimension; ++j) {
// rand_dir[j] is in [-0.5, 0.5]
rand_dir[j] = ((double)rand() / (double) RAND_MAX) - 0.5;
}
// then we get a uniformly random radius
for (int j=0; j<dimension; ++j) {
target_coords(i,j) = rand_dir[j];
}
}

Performing Neighbor Search

// Point cloud construction for neighbor search
// CreatePointCloudSearch constructs an object of type PointCloudSearch, but deduces the templates for you
auto point_cloud_search(CreatePointCloudSearch(source_coords, dimension));
double epsilon_multiplier = 1.4;
// neighbor_lists_device will contain all neighbor lists (for each target site) in a compressed row format
// Initially, we do a dry-run to calculate neighborhood sizes before actually storing the result. This is
// why we can start with a neighbor_lists_device size of 0.
Kokkos::View<int*> neighbor_lists_device("neighbor lists",
0); // first column is # of neighbors
Kokkos::View<int*>::HostMirror neighbor_lists = Kokkos::create_mirror_view(neighbor_lists_device);
// number_of_neighbors_list must be the same size as the number of target sites so that it can be populated
// with the number of neighbors for each target site.
Kokkos::View<int*> number_of_neighbors_list_device("number of neighbor lists",
number_target_coords); // first column is # of neighbors
Kokkos::View<int*>::HostMirror number_of_neighbors_list = Kokkos::create_mirror_view(number_of_neighbors_list_device);
// each target site has a window size
Kokkos::View<double*, Kokkos::DefaultExecutionSpace> epsilon_device("h supports", number_target_coords);
Kokkos::View<double*>::HostMirror epsilon = Kokkos::create_mirror_view(epsilon_device);
// query the point cloud to generate the neighbor lists using a kdtree to produce the n nearest neighbor
// to each target site, adding (epsilon_multiplier-1)*100% to whatever the distance away the further neighbor used is from
// each target to the view for epsilon
//
// This dry run populates number_of_neighbors_list with neighborhood sizes
size_t storage_size = point_cloud_search.generateCRNeighborListsFromKNNSearch(true /*dry run*/, target_coords, neighbor_lists,
number_of_neighbors_list, epsilon, min_neighbors, epsilon_multiplier);
// resize neighbor_lists_device so as to be large enough to contain all neighborhoods
Kokkos::resize(neighbor_lists_device, storage_size);
neighbor_lists = Kokkos::create_mirror_view(neighbor_lists_device);
// query the point cloud a second time, but this time storing results into neighbor_lists
point_cloud_search.generateCRNeighborListsFromKNNSearch(false /*not dry run*/, target_coords, neighbor_lists,
number_of_neighbors_list, epsilon, min_neighbors, epsilon_multiplier);

Creating The Data

// source coordinates need copied to device before using to construct sampling data
Kokkos::deep_copy(source_coords_device, source_coords);
// target coordinates copied next, because it is a convenient time to send them to device
Kokkos::deep_copy(target_coords_device, target_coords);
// need Kokkos View storing true solution
Kokkos::View<double*, Kokkos::DefaultExecutionSpace> sampling_data_device("samples of true solution",
source_coords_device.extent(0));
Kokkos::View<double**, Kokkos::DefaultExecutionSpace> gradient_sampling_data_device("samples of true gradient",
source_coords_device.extent(0), dimension);
Kokkos::View<double**, Kokkos::DefaultExecutionSpace> divergence_sampling_data_device
("samples of true solution for divergence test", source_coords_device.extent(0), dimension);
Kokkos::parallel_for("Sampling Manufactured Solutions", Kokkos::RangePolicy<Kokkos::DefaultExecutionSpace>
(0,source_coords.extent(0)), KOKKOS_LAMBDA(const int i) {
// coordinates of source site i
double xval = source_coords_device(i,0);
double yval = (dimension>1) ? source_coords_device(i,1) : 0;
double zval = (dimension>2) ? source_coords_device(i,2) : 0;
// data for targets with scalar input
sampling_data_device(i) = trueSolution(xval, yval, zval, order, dimension);
// data for targets with vector input (divergence)
double true_grad[3] = {0,0,0};
trueGradient(true_grad, xval, yval,zval, order, dimension);
for (int j=0; j<dimension; ++j) {
gradient_sampling_data_device(i,j) = true_grad[j];
// data for target with vector input (curl)
divergence_sampling_data_device(i,j) = divergenceTestSamples(xval, yval, zval, j, dimension);
}
});

Setting Up The GMLS Object

// Copy data back to device (they were filled on the host)
// We could have filled Kokkos Views with memory space on the host
// and used these instead, and then the copying of data to the device
// would be performed in the GMLS class
Kokkos::deep_copy(neighbor_lists_device, neighbor_lists);
Kokkos::deep_copy(number_of_neighbors_list_device, number_of_neighbors_list);
Kokkos::deep_copy(epsilon_device, epsilon);
// initialize an instance of the GMLS class
order, dimension,
solver_name.c_str(), problem_name.c_str(), constraint_name.c_str(),
2 /*manifold order*/);
// pass in neighbor lists, number of neighbor lists, source coordinates, target coordinates, and window sizes
//
// neighbor lists has a compressed row format and is a 1D view:
// dimensions: ? (determined by neighbor search, but total size of the sum of the number of neighbors over all target sites)
//
// number of neighbors list is a 1D view:
// dimensions: (# number of target sites)
// each entry contains the number of neighbors for a target site
//
// source coordinates have the format:
// dimensions: (# number of source sites) X (dimension)
// entries in the neighbor lists (integers) correspond to rows of this 2D array
//
// target coordinates have the format:
// dimensions: (# number of target sites) X (dimension)
// # of target sites is same as # of rows of neighbor lists
//
my_GMLS.setProblemData(neighbor_lists_device, number_of_neighbors_list_device, source_coords_device, target_coords_device, epsilon_device);
// create a vector of target operations
std::vector<TargetOperation> lro(5);
// and then pass them to the GMLS class
my_GMLS.addTargets(lro);
// sets the weighting kernel function from WeightingFunctionType
my_GMLS.setWeightingType(WeightingFunctionType::Power);
// power to use in that weighting kernel function
my_GMLS.setWeightingParameter(2);
// generate the alphas that to be combined with data for each target operation requested in lro
my_GMLS.generateAlphas(number_of_batches, keep_coefficients /* keep polynomial coefficients, only needed for a test later in this program */);

Apply GMLS Alphas To Data

// it is important to note that if you expect to use the data as a 1D view, then you should use double*
// however, if you know that the target operation will result in a 2D view (vector or matrix output),
// then you should template with double** as this is something that can not be infered from the input data
// or the target operator at compile time. Additionally, a template argument is required indicating either
// Kokkos::HostSpace or Kokkos::DefaultExecutionSpace::memory_space()
// The Evaluator class takes care of handling input data views as well as the output data views.
// It uses information from the GMLS class to determine how many components are in the input
// as well as output for any choice of target functionals and then performs the contactions
// on the data using the alpha coefficients generated by the GMLS class, all on the device.
Evaluator gmls_evaluator(&my_GMLS);
auto output_value = gmls_evaluator.applyAlphasToDataAllComponentsAllTargetSites<double*, Kokkos::HostSpace>
(sampling_data_device, ScalarPointEvaluation);
auto output_laplacian = gmls_evaluator.applyAlphasToDataAllComponentsAllTargetSites<double*, Kokkos::HostSpace>
(sampling_data_device, LaplacianOfScalarPointEvaluation);
auto output_gradient = gmls_evaluator.applyAlphasToDataAllComponentsAllTargetSites<double**, Kokkos::HostSpace>
(sampling_data_device, GradientOfScalarPointEvaluation);
auto output_divergence = gmls_evaluator.applyAlphasToDataAllComponentsAllTargetSites<double*, Kokkos::HostSpace>
(gradient_sampling_data_device, DivergenceOfVectorPointEvaluation, VectorPointSample);
auto output_curl = gmls_evaluator.applyAlphasToDataAllComponentsAllTargetSites<double**, Kokkos::HostSpace>
(divergence_sampling_data_device, CurlOfVectorPointEvaluation);
// retrieves polynomial coefficients instead of remapped field
decltype(output_curl) scalar_coefficients;
if (number_of_batches==1)
scalar_coefficients =
gmls_evaluator.applyFullPolynomialCoefficientsBasisToDataAllComponents<double**, Kokkos::HostSpace>
(sampling_data_device);

Check That Solutions Are Correct

// loop through the target sites
for (int i=0; i<number_target_coords; i++) {
// load value from output
double GMLS_value = output_value(i);
// load laplacian from output
double GMLS_Laplacian = output_laplacian(i);
// load partial x from gradient
// this is a test that the scalar_coefficients 2d array returned hold valid entries
// scalar_coefficients(i,1)*1./epsilon(i) is equivalent to the target operation acting
// on the polynomials applied to the polynomial coefficients
double GMLS_GradX = (number_of_batches==1) ? scalar_coefficients(i,1)*1./epsilon(i) : output_gradient(i,0);
// load partial y from gradient
double GMLS_GradY = (dimension>1) ? output_gradient(i,1) : 0;
// load partial z from gradient
double GMLS_GradZ = (dimension>2) ? output_gradient(i,2) : 0;
// load divergence from output
double GMLS_Divergence = output_divergence(i);
// load curl from output
double GMLS_CurlX = (dimension>1) ? output_curl(i,0) : 0;
double GMLS_CurlY = (dimension>1) ? output_curl(i,1) : 0;
double GMLS_CurlZ = (dimension>2) ? output_curl(i,2) : 0;
// target site i's coordinate
double xval = target_coords(i,0);
double yval = (dimension>1) ? target_coords(i,1) : 0;
double zval = (dimension>2) ? target_coords(i,2) : 0;
// evaluation of various exact solutions
double actual_value = trueSolution(xval, yval, zval, order, dimension);
double actual_Laplacian = trueLaplacian(xval, yval, zval, order, dimension);
double actual_Gradient[3] = {0,0,0}; // initialized for 3, but only filled up to dimension
trueGradient(actual_Gradient, xval, yval, zval, order, dimension);
double actual_Divergence;
actual_Divergence = trueLaplacian(xval, yval, zval, order, dimension);
double actual_Curl[3] = {0,0,0}; // initialized for 3, but only filled up to dimension
// (and not at all for dimimension = 1)
if (dimension>1) {
actual_Curl[0] = curlTestSolution(xval, yval, zval, 0, dimension);
actual_Curl[1] = curlTestSolution(xval, yval, zval, 1, dimension);
if (dimension>2) {
actual_Curl[2] = curlTestSolution(xval, yval, zval, 2, dimension);
}
}
// check actual function value
if(GMLS_value!=GMLS_value || std::abs(actual_value - GMLS_value) > failure_tolerance) {
all_passed = false;
std::cout << i << " Failed Actual by: " << std::abs(actual_value - GMLS_value) << std::endl;
}
// check Laplacian
if(std::abs(actual_Laplacian - GMLS_Laplacian) > laplacian_failure_tolerance) {
all_passed = false;
std::cout << i <<" Failed Laplacian by: " << std::abs(actual_Laplacian - GMLS_Laplacian) << std::endl;
}
// check gradient
if(std::abs(actual_Gradient[0] - GMLS_GradX) > failure_tolerance) {
all_passed = false;
std::cout << i << " Failed GradX by: " << std::abs(actual_Gradient[0] - GMLS_GradX) << std::endl;
if (dimension>1) {
if(std::abs(actual_Gradient[1] - GMLS_GradY) > failure_tolerance) {
all_passed = false;
std::cout << i << " Failed GradY by: " << std::abs(actual_Gradient[1] - GMLS_GradY) << std::endl;
}
}
if (dimension>2) {
if(std::abs(actual_Gradient[2] - GMLS_GradZ) > failure_tolerance) {
all_passed = false;
std::cout << i << " Failed GradZ by: " << std::abs(actual_Gradient[2] - GMLS_GradZ) << std::endl;
}
}
}
// check divergence
if(std::abs(actual_Divergence - GMLS_Divergence) > failure_tolerance) {
all_passed = false;
std::cout << i << " Failed Divergence by: " << std::abs(actual_Divergence - GMLS_Divergence) << std::endl;
}
// check curl
if (order > 2) { // reconstructed solution not in basis unless order greater than 2 used
double tmp_diff = 0;
if (dimension>1)
tmp_diff += std::abs(actual_Curl[0] - GMLS_CurlX) + std::abs(actual_Curl[1] - GMLS_CurlY);
if (dimension>2)
tmp_diff += std::abs(actual_Curl[2] - GMLS_CurlZ);
if(std::abs(tmp_diff) > failure_tolerance) {
all_passed = false;
std::cout << i << " Failed Curl by: " << std::abs(tmp_diff) << std::endl;
}
}
}

Finalize Program

} // end of code block to reduce scope, causing Kokkos View de-allocations
// otherwise, Views may be deallocating when we call Kokkos finalize() later
// finalize Kokkos and MPI (if available)
Kokkos::finalize();
#ifdef COMPADRE_USE_MPI
MPI_Finalize();
#endif
// output to user that test passed or failed
if(all_passed) {
fprintf(stdout, "Passed test \n");
return 0;
} else {
fprintf(stdout, "Failed test \n");
return -1;
}
} // main

Tutorial