SemiDiscreteOT/SoftmaxRefinement_8cc_source.html

#include "SemiDiscreteOT/solvers/SoftmaxRefinement.h"

#include <deal.II/base/quadrature_lib.h>


/**
 * Constructs the refinement helper.
 *
 * Stores the communicator, the discretization objects (DoF handler, mapping,
 * finite element), the source density and the numerical parameters, and
 * installs the Euclidean distance as the default distance function.
 *
 * @param mpi_comm               Communicator used for rank queries and reductions.
 * @param dof_handler            DoF handler whose active cells are integrated over.
 * @param mapping                Mapping handed to the FEValues scratch object.
 * @param fe                     Finite element handed to the FEValues scratch object.
 * @param source_density         Source density evaluated at the quadrature points.
 * @param quadrature_order       Order passed to the quadrature rule constructor.
 * @param distance_threshold     Cut-off distance for target point selection.
 * @param use_log_sum_exp_trick  Whether the softmax sums are shifted by their
 *                               largest exponent before exponentiation.
 */
template <int dim, int spacedim>
SoftmaxRefinement<dim, spacedim>::SoftmaxRefinement(
    MPI_Comm mpi_comm,
    const DoFHandler<dim, spacedim>& dof_handler,
    const Mapping<dim, spacedim>& mapping,
    const FiniteElement<dim, spacedim>& fe,
    const LinearAlgebra::distributed::Vector<double>& source_density,
    unsigned int quadrature_order,
    double distance_threshold,
    bool use_log_sum_exp_trick)
    : mpi_communicator(mpi_comm)
    , n_mpi_processes(Utilities::MPI::n_mpi_processes(mpi_comm))
    , this_mpi_process(Utilities::MPI::this_mpi_process(mpi_comm))
    , pcout(std::cout, this_mpi_process == 0)
    , dof_handler(dof_handler)
    , mapping(mapping)
    , fe(fe)
    , source_density(source_density)
    , quadrature_order(quadrature_order)
    , current_distance_threshold(distance_threshold)
    , use_log_sum_exp_trick(use_log_sum_exp_trick)
{
    // Default metric. The points are taken by const reference: this callable
    // is invoked for every (quadrature point, target point) pair during
    // assembly, so by-value parameters would copy two points per evaluation.
    distance_function = [](const Point<spacedim>& x, const Point<spacedim>& y) {
        return euclidean_distance<spacedim>(x, y);
    };
}


/**
 * Rebuilds target_points_rtree from the coarse target points currently
 * referenced by current_target_points_coarse.
 *
 * Each point is stored together with its position in that vector, so query
 * results can be mapped back to indices. The pointer must have been set
 * before this is called (compute_refinement does so).
 */
template <int dim, int spacedim>
void SoftmaxRefinement<dim, spacedim>::setup_rtree()
{
    const auto& coarse_points = *current_target_points_coarse;

    std::vector<IndexedPoint> entries;
    entries.reserve(coarse_points.size());

    // Pair every point with its running index in the coarse point vector.
    std::size_t position = 0;
    for (const auto& point : coarse_points) {
        entries.emplace_back(point, position);
        ++position;
    }

    // Construct the tree from the full range and replace the old one.
    target_points_rtree = RTree(entries.begin(), entries.end());
}


/**
 * Collects the indices of all coarse target points stored in
 * target_points_rtree whose distance to @p query_point, measured with
 * distance_function, does not exceed current_distance_threshold.
 *
 * @param query_point  Point around which target points are searched.
 * @return Indices (as stored in the tree entries) of the matching points;
 *         empty if none qualifies.
 */
template <int dim, int spacedim>
std::vector<std::size_t> SoftmaxRefinement<dim, spacedim>::find_nearest_target_points(
    const Point<spacedim>& query_point) const
{
    namespace bgi = boost::geometry::index;

    // Value predicate handed to the tree query: keep an entry when it lies
    // within the threshold distance of the query point.
    const auto within_threshold = [this, &query_point](const IndexedPoint& candidate) {
        return distance_function(candidate.first, query_point) <= current_distance_threshold;
    };

    std::vector<std::size_t> matches;
    for (const auto& entry : target_points_rtree | bgi::adaptors::queried(bgi::satisfies(within_threshold)))
        matches.push_back(entry.second);

    return matches;
}


/**
 * WorkStream worker: accumulates the contribution of one cell to the
 * fine-level softmax sums and leaves it in copy_data.potential_values.
 *
 * For every quadrature point x of the cell the routine
 *   1. evaluates the coarse normalization
 *        S(x) = sum_j nu_j * exp((phi_j - 0.5 * d(x, y_j)^2) / lambda)
 *      over the coarse target points selected around the cell center, and
 *   2. adds  rho(x) * JxW * exp(-0.5 * d(x, z_k)^2 / lambda) / S(x)
 *      to the entry of every fine child z_k of those coarse points.
 * Target points farther than current_distance_threshold from x are skipped
 * in both steps. When use_log_sum_exp_trick is set, all exponents are shifted
 * by the largest coarse exponent; the shift cancels between steps 1 and 2.
 *
 * @param cell          Cell to integrate over; a cell that is not locally
 *                      owned contributes nothing.
 * @param scratch_data  FEValues object and density buffer, overwritten here.
 * @param copy_data     Output buffer indexed by fine target point index;
 *                      reset to zero on every call.
 */
template <int dim, int spacedim>
void SoftmaxRefinement<dim, spacedim>::local_assemble(
    const typename DoFHandler<dim, spacedim>::active_cell_iterator &cell,
    ScratchData &scratch_data,
    CopyData &copy_data)
{
    // Reset the output first: the copier adds this buffer after every worker
    // call, so an early return must never leave a previous cell's values in it.
    copy_data.potential_values = 0;

    if (!cell->is_locally_owned())
        return;

    scratch_data.fe_values.reinit(cell);
    const std::vector<Point<spacedim>> &q_points = scratch_data.fe_values.get_quadrature_points();
    scratch_data.fe_values.get_function_values(source_density, scratch_data.density_values);

    const unsigned int n_q_points = q_points.size();
    const double lambda_inv = 1.0 / current_lambda;
    const double threshold_sq = current_distance_threshold * current_distance_threshold;

    // Coarse target points are selected once per cell, around the cell center.
    const std::vector<std::size_t> cell_target_indices_coarse = find_nearest_target_points(cell->center());
    if (cell_target_indices_coarse.empty()) return;

    const unsigned int n_target_points_coarse = cell_target_indices_coarse.size();
    std::vector<Point<spacedim>> target_positions_coarse(n_target_points_coarse);
    std::vector<double> target_densities_coarse(n_target_points_coarse);
    std::vector<double> potential_values_coarse(n_target_points_coarse);

    // Gather the coarse data into contiguous local arrays.
    for (size_t i = 0; i < n_target_points_coarse; ++i) {
        const size_t idx = cell_target_indices_coarse[i];
        target_positions_coarse[i] = (*current_target_points_coarse)[idx];
        target_densities_coarse[i] = (*current_target_density_coarse)[idx];
        potential_values_coarse[i] = (*current_potential_coarse)[idx];
    }

    // The parent -> children table is indexed by level first; validate it.
    if (current_level < 0 || current_level >= static_cast<int>(current_child_indices->size())) {
        std::cerr << "Error: Invalid level " << current_level << " for child_indices_ of size "
                  << current_child_indices->size() << std::endl;
        return;
    }

    // Collect the fine points that are children of the selected coarse points.
    std::vector<std::size_t> cell_target_indices_fine;
    std::vector<Point<spacedim>> target_positions_fine;

    for (size_t i = 0; i < n_target_points_coarse; ++i) {
        const size_t coarse_idx = cell_target_indices_coarse[i];
        if (coarse_idx >= (*current_child_indices)[current_level].size()) {
            std::cerr << "Error: Invalid coarse index " << coarse_idx << " for child_indices_["
                      << current_level << "] of size " << (*current_child_indices)[current_level].size()
                      << std::endl;
            continue;
        }
        const auto& children = (*current_child_indices)[current_level][coarse_idx];

        for (const auto& child_idx : children) {
            if (child_idx >= current_target_points_fine->size()) {
                std::cerr << "Error: Invalid child index " << child_idx << " for target_points_fine of size "
                          << current_target_points_fine->size() << std::endl;
                continue;
            }
            cell_target_indices_fine.push_back(child_idx);
            target_positions_fine.push_back((*current_target_points_fine)[child_idx]);
        }
    }

    const unsigned int n_target_points_fine = cell_target_indices_fine.size();
    if (n_target_points_fine == 0) {
        std::cerr << "Warning: No valid fine points found for coarse points at level " << current_level << std::endl;
        return;
    }

    // Per-quadrature-point work buffers, allocated once per cell and reused.
    // They hold only the coarse points that pass the distance cut-off.
    std::vector<double> active_exponents;
    std::vector<double> active_densities;
    active_exponents.reserve(n_target_points_coarse);
    active_densities.reserve(n_target_points_coarse);

    for (unsigned int q = 0; q < n_q_points; ++q) {
        const Point<spacedim> &x = q_points[q];
        const double density_value = scratch_data.density_values[q];
        const double JxW = scratch_data.fe_values.JxW(q);

        // Single pass over the coarse points: evaluate each distance once,
        // keep the exponents of the points in range and track their maximum.
        active_exponents.clear();
        active_densities.clear();
        double max_exponent = -std::numeric_limits<double>::max();

        for (size_t i = 0; i < n_target_points_coarse; ++i) {
            const double dist = distance_function(x, target_positions_coarse[i]);
            const double dist2 = dist * dist;
            // Negated "<=" so that a NaN distance is rejected.
            if (!(dist2 <= threshold_sq)) continue;

            const double exponent = (potential_values_coarse[i] - 0.5 * dist2) * lambda_inv;
            active_exponents.push_back(exponent);
            active_densities.push_back(target_densities_coarse[i]);
            max_exponent = std::max(max_exponent, exponent);
        }

        if (active_exponents.empty()) continue;

        // With the log-sum-exp trick every exponent is shifted by the maximum;
        // otherwise the shift is zero and the plain formula is evaluated.
        const double shift = use_log_sum_exp_trick ? max_exponent : 0.0;

        double total_sum_exp = 0.0;
        const size_t n_active = active_exponents.size();
        #pragma omp simd reduction(+:total_sum_exp)
        for (size_t k = 0; k < n_active; ++k) {
            total_sum_exp += active_densities[k] * std::exp(active_exponents[k] - shift);
        }

        if (total_sum_exp <= 0.0) continue;

        const double scale = density_value * JxW / total_sum_exp;

        // Scatter into the fine entries. The same shift is applied inside the
        // exponent (instead of multiplying by exp(-max_exponent) afterwards),
        // so no separate factor can overflow or underflow.
        // No "omp simd" here: the loop calls a std::function, and the target
        // indices are not guaranteed to be unique.
        for (size_t i = 0; i < n_target_points_fine; ++i) {
            const double dist_fine = distance_function(x, target_positions_fine[i]);
            const double dist2_fine = dist_fine * dist_fine;
            if (!(dist2_fine <= threshold_sq)) continue;

            const double exp_term_fine = std::exp(-0.5 * dist2_fine * lambda_inv - shift);
            copy_data.potential_values[cell_target_indices_fine[i]] += scale * exp_term_fine;
        }
    }
}


/**
 * Computes the potential on the fine target points from the coarse-level
 * potential.
 *
 * The arguments are published through the current_* members, the R-tree over
 * the coarse points is rebuilt, and local_assemble is run over all locally
 * owned cells via WorkStream. The per-process sums are then added up across
 * the communicator; rank 0 replaces every strictly positive entry s by
 * -regularization_param * log(s) and the result is broadcast from rank 0.
 * Entries that are not strictly positive are left unchanged.
 *
 * @param target_points_fine     Fine target point positions.
 * @param target_density_fine    Fine target density (stored, not read here).
 * @param target_points_coarse   Coarse target point positions.
 * @param target_density_coarse  Coarse target density.
 * @param potential_coarse       Potential on the coarse target points.
 * @param regularization_param   Regularization parameter lambda.
 * @param level                  Level used to index @p child_indices.
 * @param child_indices          child_indices[level][coarse] lists fine children.
 * @return Vector with one entry per fine target point, identical on all ranks.
 */
template <int dim, int spacedim>
Vector<double> SoftmaxRefinement<dim, spacedim>::compute_refinement(
    const std::vector<Point<spacedim>>& target_points_fine,
    const Vector<double>& target_density_fine,
    const std::vector<Point<spacedim>>& target_points_coarse,
    const Vector<double>& target_density_coarse,
    const Vector<double>& potential_coarse,
    double regularization_param,
    int level,
    const std::vector<std::vector<std::vector<size_t>>>& child_indices)
{
    using CellIterator = typename DoFHandler<dim, spacedim>::active_cell_iterator;

    // Publish this call's inputs to the members read by the assembly workers.
    current_lambda = regularization_param;
    current_level = level;
    current_child_indices = &child_indices;
    current_potential_coarse = &potential_coarse;
    current_target_density_coarse = &target_density_coarse;
    current_target_points_coarse = &target_points_coarse;
    current_target_density_fine = &target_density_fine;
    current_target_points_fine = &target_points_fine;

    // Spatial index over the coarse points (needs the pointers set above).
    setup_rtree();

    const std::size_t n_fine = target_points_fine.size();
    Vector<double> potential_fine(n_fine);
    Vector<double> local_process_potential(n_fine);

    // Pick the quadrature family that matches the reference cell of the element.
    const bool is_simplex_fe =
        dynamic_cast<const FE_SimplexP<dim, spacedim>*>(&fe) != nullptr;
    std::unique_ptr<Quadrature<dim>> cell_quadrature;
    if (is_simplex_fe)
        cell_quadrature = std::make_unique<QGaussSimplex<dim>>(quadrature_order);
    else
        cell_quadrature = std::make_unique<QGauss<dim>>(quadrature_order);

    // Prototype scratch/copy objects; WorkStream works on copies of them.
    ScratchData sample_scratch(fe, mapping, *cell_quadrature);
    CopyData sample_copy(n_fine);

    // Iterate over locally owned active cells only.
    FilteredIterator<CellIterator> begin_filtered(IteratorFilters::LocallyOwnedCell(),
                                                  dof_handler.begin_active());
    FilteredIterator<CellIterator> end_filtered(IteratorFilters::LocallyOwnedCell(),
                                                dof_handler.end());

    const auto worker = [this](const CellIterator &cell,
                               ScratchData &scratch,
                               CopyData &copy) {
        this->local_assemble(cell, scratch, copy);
    };
    const auto copier = [&local_process_potential](const CopyData &copy) {
        local_process_potential += copy.potential_values;
    };

    WorkStream::run(begin_filtered, end_filtered, worker, copier, sample_scratch, sample_copy);

    // Add up the contributions of all MPI processes.
    potential_fine = 0;
    Utilities::MPI::sum(local_process_potential, mpi_communicator, potential_fine);

    // Rank 0 turns the accumulated sums into potentials: s -> -lambda * log(s).
    const bool on_root = (Utilities::MPI::this_mpi_process(mpi_communicator) == 0);
    if (on_root) {
        for (unsigned int k = 0; k < target_points_fine.size(); ++k) {
            const double accumulated = potential_fine[k];
            if (accumulated > 0.0)
                potential_fine[k] = -regularization_param * std::log(accumulated);
        }
    }

    // Distribute rank 0's result so that every process returns the same vector.
    potential_fine = Utilities::MPI::broadcast(mpi_communicator, potential_fine, 0);
    return potential_fine;
}


// Explicit instantiation
// The member functions above are defined in this translation unit, so the
// template is instantiated here for each supported <dim, spacedim> pair.
// NOTE(review): the one-argument forms presumably rely on spacedim defaulting
// to dim in the class declaration - confirm in SoftmaxRefinement.h.

// dim = 2
template class SoftmaxRefinement<2>;

// dim = 3
template class SoftmaxRefinement<3>;

// dim = 2, spacedim = 3
template class SoftmaxRefinement<2, 3>;

SoftmaxRefinement.h

SoftmaxRefinement
A class for refining the optimal transport potential using a softmax operation.
Definition SoftmaxRefinement.h:43

SoftmaxRefinement::find_nearest_target_points
std::vector< std::size_t > find_nearest_target_points(const Point< spacedim > &query_point) const
Finds the target points that lie within the current distance threshold of a query point.
Definition SoftmaxRefinement.cc:44

SoftmaxRefinement::setup_rtree
void setup_rtree()
Sets up the R-tree.
Definition SoftmaxRefinement.cc:30

SoftmaxRefinement::compute_refinement
Vector< double > compute_refinement(const std::vector< Point< spacedim > > &target_points_fine, const Vector< double > &target_density_fine, const std::vector< Point< spacedim > > &target_points_coarse, const Vector< double > &target_density_coarse, const Vector< double > &potential_coarse, double regularization_param, int current_level, const std::vector< std::vector< std::vector< size_t > > > &child_indices)
Computes the refined potential.
Definition SoftmaxRefinement.cc:201

SoftmaxRefinement::SoftmaxRefinement
SoftmaxRefinement(MPI_Comm mpi_comm, const DoFHandler< dim, spacedim > &dof_handler, const Mapping< dim, spacedim > &mapping, const FiniteElement< dim, spacedim > &fe, const LinearAlgebra::distributed::Vector< double > &source_density, unsigned int quadrature_order, double distance_threshold, bool use_log_sum_exp_trick=true)
Constructor for the SoftmaxRefinement class.
Definition SoftmaxRefinement.cc:5

SoftmaxRefinement::local_assemble
void local_assemble(const typename DoFHandler< dim, spacedim >::active_cell_iterator &cell, ScratchData &scratch_data, CopyData &copy_data)
Assembles the local contributions to the refined potential.
Definition SoftmaxRefinement.cc:62

SoftmaxRefinement::distance_function
std::function< double(const Point< spacedim > &, const Point< spacedim > &)> distance_function
The distance function.
Definition SoftmaxRefinement.h:137

SoftmaxRefinement::RTree
boost::geometry::index::rtree< IndexedPoint, RTreeParams > RTree
Definition SoftmaxRefinement.h:149

SoftmaxRefinement::IndexedPoint
std::pair< Point< spacedim >, std::size_t > IndexedPoint
Definition SoftmaxRefinement.h:147

SoftmaxRefinement::CopyData
A struct to hold copy data for parallel assembly.
Definition SoftmaxRefinement.h:80

SoftmaxRefinement::CopyData::potential_values
Vector< double > potential_values
The potential values at the target points.
Definition SoftmaxRefinement.h:81

SoftmaxRefinement::ScratchData
A struct to hold scratch data for parallel assembly.
Definition SoftmaxRefinement.h:58

SoftmaxRefinement::ScratchData::fe_values
FEValues< dim, spacedim > fe_values
FEValues object for the current cell.
Definition SoftmaxRefinement.h:73

SoftmaxRefinement::ScratchData::density_values
std::vector< double > density_values
The density values at the quadrature points of the current cell.
Definition SoftmaxRefinement.h:74