Shamrock 2025.10.0
Astrophysical Code
Loading...
Searching...
No Matches
SinkParticlesUpdate.cpp
Go to the documentation of this file.
1// -------------------------------------------------------//
2//
3// SHAMROCK code for hydrodynamics
4// Copyright (c) 2021-2026 Timothée David--Cléris <tim.shamrock@proton.me>
5// SPDX-License-Identifier: CeCILL Free Software License Agreement v2.1
6// Shamrock is licensed under the CeCILL 2.1 License, see LICENSE for more information
7//
8// -------------------------------------------------------//
9
25#include "shamcomm/logs.hpp"
28#include <shambackends/sycl.hpp>
29
30template<class Tvec, template<class> class SPHKernel>
32 StackEntry stack_loc{};
33
34 Tscal gpart_mass = solver_config.gpart_mass;
35
36 if (storage.sinks.is_empty()) {
37 return;
38 }
39
40 using namespace shamrock;
41 using namespace shamrock::patch;
42
43 PatchDataLayerLayout &pdl = scheduler().pdl_old();
44 const u32 ixyz = pdl.get_field_idx<Tvec>("xyz");
45 const u32 ivxyz = pdl.get_field_idx<Tvec>("vxyz");
46 const u32 iaxyz = pdl.get_field_idx<Tvec>("axyz");
47
48 auto dev_sched = shamsys::instance::get_compute_scheduler_ptr();
49 sham::DeviceQueue &q = shambase::get_check_ref(dev_sched).get_queue();
50
51 std::vector<Sink> &sink_parts = storage.sinks.get();
52
53 u32 sink_id = 0;
54 bool had_accretion = false;
55 std::string log = "sink accretion :";
56
57 struct AccretionFlagBufs {
58 sham::DeviceBuffer<u32> not_accreted;
60 };
61
62 for (size_t sink_id = 0; sink_id < sink_parts.size(); sink_id++) {
63 Sink &s = sink_parts[sink_id];
64
65 Tvec r_sink = s.pos;
66 Tvec v_sink = s.velocity;
67 Tscal acc_rad2 = s.accretion_radius * s.accretion_radius;
68
69 // flags particles for accretion
71
72 scheduler().for_each_patchdata_nonempty([&](Patch cur_p, PatchDataLayer &pdat) {
73 u32 Nobj = pdat.get_obj_cnt();
74
75 sham::DeviceBuffer<Tvec> &buf_xyz = pdat.get_field_buf_ref<Tvec>(ixyz);
76 sham::DeviceBuffer<Tvec> &buf_vxyz = pdat.get_field_buf_ref<Tvec>(ivxyz);
77
78 sham::DeviceBuffer<u32> not_accreted(Nobj, dev_sched);
79 sham::DeviceBuffer<u32> accreted(Nobj, dev_sched);
80
82 q,
83 sham::MultiRef{buf_xyz},
84 sham::MultiRef{not_accreted, accreted},
85 Nobj,
86 [r_sink, acc_rad2](
87 u32 id_a,
88 const Tvec *__restrict xyz,
89 u32 *__restrict not_acc,
90 u32 *__restrict acc) {
91 Tvec r = xyz[id_a] - r_sink;
92 bool not_accreted = sycl::dot(r, r) > acc_rad2;
93 not_acc[id_a] = (not_accreted) ? 1 : 0;
94 acc[id_a] = (!not_accreted) ? 1 : 0;
95 });
96
97 accretion_flag_bufs.add_obj(
98 cur_p.id_patch, AccretionFlagBufs{std::move(not_accreted), std::move(accreted)});
99 });
100
101 // list the ids that will be accreted
103
104 scheduler().for_each_patchdata_nonempty([&](Patch cur_p, PatchDataLayer &pdat) {
105 u32 Nobj = pdat.get_obj_cnt();
106
107 sham::DeviceBuffer<u32> &accreted = accretion_flag_bufs.get(cur_p.id_patch).accreted;
108
109 sham::DeviceBuffer<u32> id_list_accrete
110 = shamalgs::stream_compact(dev_sched, accreted, Nobj);
111
112 bufs_id_list_accrete.add_obj(cur_p.id_patch, std::move(id_list_accrete));
113 });
114
115 // compute the accreted mass, position moment and linear momentum
116 Tscal s_acc_mass = 0;
117 Tvec s_acc_mxyz = {0, 0, 0};
118 Tvec s_acc_pxyz = {0, 0, 0};
119 Tvec s_acc_maxyz = {0, 0, 0};
120 Tvec s_acc_lxyz = {0, 0, 0};
121
122 scheduler().for_each_patchdata_nonempty([&](Patch cur_p, PatchDataLayer &pdat) {
123 u32 Nobj = pdat.get_obj_cnt();
124
125 sham::DeviceBuffer<Tvec> &buf_xyz = pdat.get_field_buf_ref<Tvec>(ixyz);
126 sham::DeviceBuffer<Tvec> &buf_vxyz = pdat.get_field_buf_ref<Tvec>(ivxyz);
127 sham::DeviceBuffer<Tvec> &buf_axyz = pdat.get_field_buf_ref<Tvec>(iaxyz);
128
129 sham::DeviceBuffer<u32> &id_list_accrete = bufs_id_list_accrete.get(cur_p.id_patch);
130
131 // sum accreted values onto sink
132 if (id_list_accrete.get_size() > 0) {
133 u32 Naccrete = shambase::narrow_or_throw<u32>(id_list_accrete.get_size());
134
135 Tscal acc_mass = gpart_mass * Naccrete;
136
137 sham::DeviceBuffer<Tvec> pxyz_acc(Naccrete, dev_sched);
138 sham::DeviceBuffer<Tvec> maxyz_acc(Naccrete, dev_sched);
139 sham::DeviceBuffer<Tvec> mxyz_acc(Naccrete, dev_sched);
140 sham::DeviceBuffer<Tvec> lxyz_acc(Naccrete, dev_sched);
141
143 q,
144 sham::MultiRef{buf_xyz, buf_vxyz, buf_axyz, id_list_accrete},
145 sham::MultiRef{pxyz_acc, mxyz_acc, maxyz_acc, lxyz_acc},
146 Naccrete,
147 [gpart_mass, r_sink, v_sink, dt](
148 u32 id_a,
149 const Tvec *__restrict xyz,
150 const Tvec *__restrict vxyz,
151 const Tvec *__restrict axyz,
152 const u32 *__restrict id_acc,
153 Tvec *__restrict accretion_p,
154 Tvec *__restrict accretion_mr,
155 Tvec *__restrict accretion_ma,
156 Tvec *__restrict accretion_l) {
157 u32 i_a = id_acc[id_a];
158 Tvec r = xyz[i_a];
159 Tvec v = vxyz[i_a];
160 Tvec a = axyz[i_a];
161 accretion_p[id_a] = gpart_mass * v;
162 accretion_mr[id_a] = gpart_mass * r;
163 accretion_ma[id_a] = gpart_mass * a;
164
165 // dirty trick to account for the residual acceleration in the spin. This
166 // allows us to maintain a much better angular momentum conservation.
167 v += a * dt / 2;
168 accretion_l[id_a] = gpart_mass * sycl::cross(r - r_sink, v - v_sink);
169 });
170
171 Tvec acc_pxyz = shamalgs::primitives::sum(dev_sched, pxyz_acc, 0, Naccrete);
172 Tvec acc_mxyz = shamalgs::primitives::sum(dev_sched, mxyz_acc, 0, Naccrete);
173 Tvec acc_maxyz = shamalgs::primitives::sum(dev_sched, maxyz_acc, 0, Naccrete);
174 Tvec acc_lxyz = shamalgs::primitives::sum(dev_sched, lxyz_acc, 0, Naccrete);
175
176 s_acc_mass += acc_mass;
177 s_acc_pxyz += acc_pxyz;
178 s_acc_mxyz += acc_mxyz;
179 s_acc_maxyz += acc_maxyz;
180 s_acc_lxyz += acc_lxyz;
181 }
182 });
183
184 Tscal sum_acc_mass = shamalgs::collective::allreduce_sum(s_acc_mass);
185
186 // if there is accretion continue otherwise skip that part
187 if (sum_acc_mass <= 0) {
188 continue;
189 }
190
191 Tvec sum_acc_pxyz = shamalgs::collective::allreduce_sum(s_acc_pxyz);
192 Tvec sum_acc_mxyz = shamalgs::collective::allreduce_sum(s_acc_mxyz);
193 Tvec sum_acc_maxyz = shamalgs::collective::allreduce_sum(s_acc_maxyz);
194 Tvec sum_acc_lxyz = shamalgs::collective::allreduce_sum(s_acc_lxyz);
195
196 // compute the new sink values
197 Tscal new_mass = s.mass + sum_acc_mass;
198 Tvec new_pos = (sum_acc_mxyz + s.pos * s.mass) / (s.mass + sum_acc_mass);
199 Tvec new_vel = (sum_acc_pxyz + s.velocity * s.mass) / (s.mass + sum_acc_mass);
200 Tvec new_acc = (sum_acc_maxyz + s.sph_acceleration * s.mass) / (s.mass + sum_acc_mass);
201 Tvec new_ang_mom = s.angular_momentum + sum_acc_lxyz
202 - new_mass * sycl::cross(new_pos - s.pos, new_vel - s.velocity);
203
204 // write back the updated sink state
205 auto new_state = s;
206 new_state.mass = new_mass;
207 new_state.pos = new_pos;
208 new_state.velocity = new_vel;
209 new_state.angular_momentum = new_ang_mom;
210 new_state.sph_acceleration = new_acc;
211
212 had_accretion = true;
213 log += shambase::format(
214 "\n id {} deltas : mass={} r={} v={} l={}",
215 sink_id,
216 new_state.mass - s.mass,
217 new_state.pos - s.pos,
218 new_state.velocity - s.velocity,
219 new_state.angular_momentum - s.angular_momentum);
220
221 s = new_state;
222
223 // evict accreted particles from patches
224 scheduler().for_each_patchdata_nonempty([&](Patch cur_p, PatchDataLayer &pdat) {
225 u32 Nobj = pdat.get_obj_cnt();
226
227 sham::DeviceBuffer<u32> &not_accreted
228 = accretion_flag_bufs.get(cur_p.id_patch).not_accreted;
229 sham::DeviceBuffer<u32> &accreted = accretion_flag_bufs.get(cur_p.id_patch).accreted;
230
231 sham::DeviceBuffer<u32> &id_list_accrete = bufs_id_list_accrete.get(cur_p.id_patch);
232
233 if (id_list_accrete.get_size() > 0) {
234
235 sham::DeviceBuffer<u32> id_list_keep
236 = shamalgs::stream_compact(dev_sched, not_accreted, Nobj);
237
238 pdat.keep_ids(
239 id_list_keep, shambase::narrow_or_throw<u32>(id_list_keep.get_size()));
240 }
241 });
242 }
243
244 if (shamcomm::world_rank() == 0 && had_accretion) {
245 logger::info_ln("sph::Sink", log);
246 }
247}
248
249template<class Tvec, template<class> class SPHKernel>
251
252 StackEntry stack_loc{};
253
254 if (storage.sinks.is_empty()) {
255 return;
256 }
257
258 compute_ext_forces();
259
260 std::vector<Sink> &sink_parts = storage.sinks.get();
261
262 for (Sink &s : sink_parts) {
263 s.velocity += (dt / 2) * s.sph_acceleration;
264 }
265
266 for (Sink &s : sink_parts) {
267 s.velocity += (dt / 2) * s.ext_acceleration;
268 }
269
270 for (Sink &s : sink_parts) {
271 s.pos += (dt) *s.velocity;
272 }
273
274 for (Sink &s : sink_parts) {
275 s.velocity += (dt / 2) * s.ext_acceleration;
276 }
277}
278
279template<class Tvec, template<class> class SPHKernel>
281
282 StackEntry stack_loc{};
283
284 if (storage.sinks.is_empty()) {
285 return;
286 }
287
288 std::vector<Sink> &sink_parts = storage.sinks.get();
289
290 for (Sink &s : sink_parts) {
291 s.velocity += (dt / 2) * s.sph_acceleration;
292 }
293}
294
295template<class Tvec, template<class> class SPHKernel>
297
298 StackEntry stack_loc{};
299
300 Tscal gpart_mass = solver_config.gpart_mass;
301
302 if (storage.sinks.is_empty()) {
303 return;
304 }
305
306 std::vector<Sink> &sink_parts = storage.sinks.get();
307
308 Tscal G = solver_config.get_constant_G();
309 Tscal epsilon_grav = 1e-9;
310
311 using namespace shamrock;
312 using namespace shamrock::patch;
313
314 PatchDataLayerLayout &pdl = scheduler().pdl_old();
315 const u32 ixyz = pdl.get_field_idx<Tvec>("xyz");
316 const u32 iaxyz_ext = pdl.get_field_idx<Tvec>("axyz_ext");
317
318 auto dev_sched = shamsys::instance::get_compute_scheduler_ptr();
319 sham::DeviceQueue &q = shambase::get_check_ref(dev_sched).get_queue();
320
321 std::vector<Tvec> result_acc_sinks{};
322
323 for (Sink &s : sink_parts) {
324
325 Tvec sph_acc_sink = {};
326
327 scheduler().for_each_patchdata_nonempty(
328 [&, G, epsilon_grav, gpart_mass](Patch cur_p, PatchDataLayer &pdat) {
329 sham::DeviceBuffer<Tvec> &buf_xyz = pdat.get_field_buf_ref<Tvec>(ixyz);
330 sham::DeviceBuffer<Tvec> &buf_axyz_ext = pdat.get_field_buf_ref<Tvec>(iaxyz_ext);
331
332 sham::DeviceBuffer<Tvec> buf_sync_axyz(pdat.get_obj_cnt(), dev_sched);
333
334 Tscal sink_mass = s.mass;
335 Tscal sink_racc = s.accretion_radius;
336 Tvec sink_pos = s.pos;
337
338 sham::EventList depends_list;
339 auto xyz = buf_xyz.get_read_access(depends_list);
340 auto axyz_ext = buf_axyz_ext.get_write_access(depends_list);
341 auto axyz_sync = buf_sync_axyz.get_write_access(depends_list);
342
343 auto e = q.submit(
344 depends_list,
345 [&, G, epsilon_grav, sink_mass, sink_pos, sink_racc](sycl::handler &cgh) {
346 shambase::parallel_for(
347 cgh, pdat.get_obj_cnt(), "sink-sph forces", [=](i32 id_a) {
348 Tvec r_a = xyz[id_a];
349
350 Tvec delta = r_a - sink_pos;
351 Tscal d = sycl::length(delta);
352
353 Tvec force = G * delta / (d * d * d);
354
355 // This is a hack to avoid the sink kaboom effect
356 // when the particle is being advected close to the sink before
357 // being accreted
358 if (d < sink_racc) {
359 force = {0, 0, 0};
360 }
361
362 axyz_sync[id_a] = force * gpart_mass;
363 axyz_ext[id_a] += -force * sink_mass;
364 });
365 });
366
367 buf_xyz.complete_event_state(e);
368 buf_axyz_ext.complete_event_state(e);
369 buf_sync_axyz.complete_event_state(e);
370
371 sph_acc_sink
372 += shamalgs::primitives::sum(dev_sched, buf_sync_axyz, 0, pdat.get_obj_cnt());
373 });
374
375 result_acc_sinks.push_back(sph_acc_sink);
376 }
377
378 std::vector<Tvec> gathered_result_acc_sinks{};
380 result_acc_sinks, gathered_result_acc_sinks, MPI_COMM_WORLD);
381
382 u32 id_s = 0;
383 for (Sink &s : sink_parts) {
384
385 s.sph_acceleration = {};
386
387 for (u32 rid = 0; rid < shamcomm::world_size(); rid++) {
388 s.sph_acceleration += gathered_result_acc_sinks[rid * sink_parts.size() + id_s];
389 }
390
391 id_s++;
392 }
393}
394
395template<class Tvec, template<class> class SPHKernel>
397
398 StackEntry stack_loc{};
399
400 if (storage.sinks.is_empty()) {
401 return;
402 }
403
404 std::vector<Sink> &sink_parts = storage.sinks.get();
405
406 for (Sink &s : sink_parts) {
407 s.ext_acceleration = Tvec{};
408 }
409
410 Tscal G = solver_config.get_constant_G();
411 Tscal epsilon_grav_sink = 1e-9;
412
413 for (Sink &s1 : sink_parts) {
414 Tvec sum{};
415 for (Sink &s2 : sink_parts) {
416 Tvec rij = s1.pos - s2.pos;
417 Tscal rij_scal = sycl::length(rij);
418 sum -= G * s2.mass * rij / (rij_scal * rij_scal * rij_scal + epsilon_grav_sink);
419 }
420 s1.ext_acceleration = sum;
421 }
422}
423
424using namespace shammath;
428
constexpr const char * axyz
3-acceleration field
constexpr const char * vxyz
3-velocity field
constexpr const char * xyz
Position field (3D coordinates)
std::uint32_t u32
32 bit unsigned integer
std::int32_t i32
32 bit integer
A buffer allocated in USM (Unified Shared Memory)
void complete_event_state(sycl::event e) const
Complete the event state of the buffer.
size_t get_size() const
Gets the number of elements in the buffer.
const T * get_read_access(sham::EventList &depends_list, SourceLocation src_loc=SourceLocation{}) const
Get a read-only pointer to the buffer's data.
A SYCL queue associated with a device and a context.
sycl::event submit(Fct &&fct)
Submits a kernel to the SYCL queue.
Class to manage a list of SYCL events.
Definition EventList.hpp:31
Represents a collection of objects distributed across patches identified by a u64 id.
u32 get_field_idx(const std::string &field_name) const
Get the field id if matching name & type.
PatchDataLayer container class, the layout is described in patchdata_layout.
std::vector< int > vector_allgatherv(const std::vector< T > &send_vec, const MPI_Datatype &send_type, std::vector< T > &recv_vec, const MPI_Datatype &recv_type, const MPI_Comm comm)
allgatherv on vector with size query (size querying variant of vector_allgatherv_ks) //TODO add fault...
Definition exchanges.hpp:98
void kernel_call(sham::DeviceQueue &q, RefIn in, RefOut in_out, u32 n, Functor &&func, SourceLocation &&callsite=SourceLocation{})
Submit a kernel to a SYCL queue.
std::tuple< std::optional< sycl::buffer< u32 > >, u32 > stream_compact(sycl::queue &q, sycl::buffer< u32 > &buf_flags, u32 len)
Stream compaction algorithm.
Definition numeric.cpp:84
T sum(const sham::DeviceScheduler_ptr &sched, const sham::DeviceBuffer< T > &buf1, u32 start_id, u32 end_id)
Compute the sum of elements in a device buffer within a specified range.
void throw_with_loc(std::string message, SourceLocation loc=SourceLocation{})
Throw an exception and append the source location to it.
T & get_check_ref(const std::unique_ptr< T > &ptr, SourceLocation loc=SourceLocation())
Takes a std::unique_ptr and returns a reference to the object it holds. It throws a std::runtime_error...
Definition memory.hpp:110
i32 world_rank()
Gives the rank of the current process in the MPI communicator.
Definition worldInfo.cpp:40
i32 world_size()
Gives the size of the MPI communicator.
Definition worldInfo.cpp:38
namespace for math utility
Definition AABB.hpp:26
namespace for the main framework
Definition __init__.py:1
Utilities for safe type narrowing conversions.
sph kernels
A class that references multiple buffers or similar objects.
Patch object that contain generic patch information.
Definition Patch.hpp:33
u64 id_patch
unique key that identify the patch
Definition Patch.hpp:86