Shamrock/doxygen/NeighbourCache_8cpp_source.html

// -------------------------------------------------------//

//

// SHAMROCK code for hydrodynamics

// Copyright (c) 2021-2026 Timothée David--Cléris <tim.shamrock@proton.me>

// SPDX-License-Identifier: CeCILL Free Software License Agreement v2.1

// Shamrock is licensed under the CeCILL 2.1 License, see LICENSE for more information

//

// -------------------------------------------------------//


#include "shambase/aliases_int.hpp"

#include "shambase/assert.hpp"

#include "shambase/memory.hpp"

#include "shambackends/DeviceBuffer.hpp"

#include "shammath/sphkernels.hpp"

#include "shammodels/sph/modules/NeighbourCache.hpp"

#include "shamsys/legacy/log.hpp"

#include "shamtree/TreeTraversal.hpp"

#include "shamtree/kernels/geometry_utils.hpp"

#include "shamunits/Constants.hpp"


/**
 * @brief Build the per-patch neighbour cache with a single-stage (particle vs tree) walk.
 *
 * For every non-empty patch two kernels are launched over the `obj_cnt` objects of the patch
 * (`obj_cnt` is read from `storage.part_counts`):
 *  - "compute neigh cache 1" walks the merged position tree and counts, for each particle `a`,
 *    the objects `b` that pass the pair test;
 *  - "compute neigh cache 2" repeats the exact same walk and writes the ids of those objects
 *    into the index map, starting at the offset read from the scanned counts produced by
 *    `tree::prepare_object_cache`.
 *
 * Pair test: `b` is rejected only when `r_ab^2` is strictly larger than both
 * `(h_a * htol * Rkern)^2` and `(h_b * htol * Rkern)^2`, with
 * `htol = solver_config.htol_up_coarse_cycle`. Both kernels must use the same test, otherwise
 * the fill pass would write past the slots reserved by the count pass.
 *
 * `free_alloc()` is called on `storage.neigh_cache` before the new caches are added, and the
 * elapsed wall time is accumulated into `storage.timings_details.neighbors`.
 */
template<class Tvec, class Tmorton, template<class> class SPHKernel>
void shammodels::sph::modules::NeighbourCache<Tvec, Tmorton, SPHKernel>::start_neighbors_cache() {

    using RTree = shamtree::CompressedLeafBVH<Tmorton, Tvec, 3>;

    shambase::Timer time_neigh;
    time_neigh.start();

    StackEntry stack_loc{};

    // Builds and returns the neighbour cache of a single patch.
    auto build_neigh_cache = [&](u64 patch_id) {
        shamlog_debug_ln("BasicSPH", "build particle cache id =", patch_id);

        NamedStackEntry cache_build_stack_loc{"build cache"};

        auto &mfield = storage.merged_xyzh.get().get(patch_id);

        // Field 0 is read as positions, field 1 as smoothing lengths.
        sham::DeviceBuffer<Tvec> &buf_xyz    = mfield.template get_field_buf_ref<Tvec>(0);
        sham::DeviceBuffer<Tscal> &buf_hpart = mfield.template get_field_buf_ref<Tscal>(1);

        // Per tree node value, scaled by Rkern below to extend the node box during the walk.
        sham::DeviceBuffer<Tscal> &tree_field_rint
            = storage.rtree_rint_field.get().get(patch_id).buf_field;

        RTree &tree = storage.merged_pos_trees.get().get(patch_id);
        auto obj_it = tree.get_object_iterator();

        u32 obj_cnt = shambase::get_check_ref(storage.part_counts).indexes.get(patch_id);

        Tscal h_tolerance = solver_config.htol_up_coarse_cycle;

        NamedStackEntry stack_loc1{"init cache"};

        using namespace shamrock;

        sham::DeviceBuffer<u32> neigh_count(
            obj_cnt, shamsys::instance::get_compute_scheduler_ptr());

        shamsys::instance::get_compute_queue().wait_and_throw();

        shamlog_debug_sycl_ln("Cache", "generate cache for N=", obj_cnt);

        // Pass 1: count the neighbours of every particle.
        {
            sham::DeviceQueue &q = shamsys::instance::get_compute_scheduler().get_queue();
            sham::EventList depends_list;

            auto xyz             = buf_xyz.get_read_access(depends_list);
            auto hpart           = buf_hpart.get_read_access(depends_list);
            auto rint_tree       = tree_field_rint.get_read_access(depends_list);
            auto neigh_cnt       = neigh_count.get_write_access(depends_list);
            auto particle_looper = obj_it.get_read_access(depends_list);

            auto e = q.submit(depends_list, [&, h_tolerance](sycl::handler &cgh) {
                constexpr Tscal Rker2 = Kernel::Rkern * Kernel::Rkern;

                shambase::parallel_for(cgh, obj_cnt, "compute neigh cache 1", [=](u64 gid) {
                    u32 id_a = static_cast<u32>(gid);

                    Tscal rint_a = hpart[id_a] * h_tolerance;
                    Tvec xyz_a   = xyz[id_a];

                    // Squared interaction radius of a, invariant during the walk.
                    const Tscal rcut2_a = rint_a * rint_a * Rker2;

                    Tvec inter_box_a_min = xyz_a - rint_a * Kernel::Rkern;
                    Tvec inter_box_a_max = xyz_a + rint_a * Kernel::Rkern;

                    u32 cnt = 0;

                    particle_looper.rtree_for(
                        // Node acceptance criterion.
                        [&](u32 node_id, shammath::AABB<Tvec> node_aabb) -> bool {
                            Tscal int_r_max_cell = rint_tree[node_id] * Kernel::Rkern;

                            using namespace walker::interaction_crit;

                            return sph_radix_cell_crit(
                                xyz_a,
                                inter_box_a_min,
                                inter_box_a_max,
                                node_aabb.lower,
                                node_aabb.upper,
                                int_r_max_cell);
                        },
                        // Called for every object of the accepted leaves.
                        [&](u32 id_b) {
                            Tvec dr      = xyz_a - xyz[id_b];
                            Tscal rab2   = sycl::dot(dr, dr);
                            Tscal rint_b = hpart[id_b] * h_tolerance;

                            // Kept as "strictly outside both radii" so that the behaviour for
                            // non-finite values is unchanged.
                            bool no_interact = rab2 > rcut2_a && rab2 > rint_b * rint_b * Rker2;

                            if (!no_interact) {
                                cnt++;
                            }
                        });

                    neigh_cnt[id_a] = cnt;
                });
            });

            buf_xyz.complete_event_state(e);
            buf_hpart.complete_event_state(e);
            neigh_count.complete_event_state(e);
            tree_field_rint.complete_event_state(e);
            obj_it.complete_event_state(e);
        }

        // Turns the counts into the cache structure (scanned counts + index map storage).
        tree::ObjectCache pcache = tree::prepare_object_cache(std::move(neigh_count), obj_cnt);

        NamedStackEntry stack_loc2{"fill cache"};

        // Pass 2: same walk as pass 1, but the neighbour ids are written out.
        {
            sham::DeviceQueue &q = shamsys::instance::get_compute_scheduler().get_queue();
            sham::EventList depends_list;

            auto xyz               = buf_xyz.get_read_access(depends_list);
            auto hpart             = buf_hpart.get_read_access(depends_list);
            auto rint_tree         = tree_field_rint.get_read_access(depends_list);
            auto scanned_neigh_cnt = pcache.scanned_cnt.get_read_access(depends_list);
            auto neigh             = pcache.index_neigh_map.get_write_access(depends_list);
            auto particle_looper   = obj_it.get_read_access(depends_list);

            auto e = q.submit(depends_list, [&, h_tolerance](sycl::handler &cgh) {
                constexpr Tscal Rker2 = Kernel::Rkern * Kernel::Rkern;

                shambase::parallel_for(cgh, obj_cnt, "compute neigh cache 2", [=](u64 gid) {
                    u32 id_a = static_cast<u32>(gid);

                    Tscal rint_a = hpart[id_a] * h_tolerance;
                    Tvec xyz_a   = xyz[id_a];

                    // Squared interaction radius of a, invariant during the walk.
                    const Tscal rcut2_a = rint_a * rint_a * Rker2;

                    Tvec inter_box_a_min = xyz_a - rint_a * Kernel::Rkern;
                    Tvec inter_box_a_max = xyz_a + rint_a * Kernel::Rkern;

                    // Write cursor: first slot of particle a in the index map.
                    u32 cnt = scanned_neigh_cnt[id_a];

                    particle_looper.rtree_for(
                        // Node acceptance criterion (identical to pass 1).
                        [&](u32 node_id, shammath::AABB<Tvec> node_aabb) -> bool {
                            Tscal int_r_max_cell = rint_tree[node_id] * Kernel::Rkern;

                            using namespace walker::interaction_crit;

                            return sph_radix_cell_crit(
                                xyz_a,
                                inter_box_a_min,
                                inter_box_a_max,
                                node_aabb.lower,
                                node_aabb.upper,
                                int_r_max_cell);
                        },
                        // Called for every object of the accepted leaves.
                        [&](u32 id_b) {
                            Tvec dr      = xyz_a - xyz[id_b];
                            Tscal rab2   = sycl::dot(dr, dr);
                            Tscal rint_b = hpart[id_b] * h_tolerance;

                            bool no_interact = rab2 > rcut2_a && rab2 > rint_b * rint_b * Rker2;

                            if (!no_interact) {
                                neigh[cnt] = id_b;
                                cnt++;
                            }
                        });
                });
            });

            buf_xyz.complete_event_state(e);
            buf_hpart.complete_event_state(e);
            tree_field_rint.complete_event_state(e);
            pcache.scanned_cnt.complete_event_state(e);
            pcache.index_neigh_map.complete_event_state(e);
            obj_it.complete_event_state(e);
        }

        return pcache;
    };

    shambase::get_check_ref(storage.neigh_cache).free_alloc();

    using namespace shamrock::patch;
    scheduler().for_each_patchdata_nonempty([&](Patch cur_p, PatchDataLayer &) {
        auto &ncache = shambase::get_check_ref(storage.neigh_cache);
        ncache.neigh_cache.add_obj(cur_p.id_patch, build_neigh_cache(cur_p.id_patch));
    });

    time_neigh.end();
    storage.timings_details.neighbors += time_neigh.elasped_sec();
}


/**
 * @brief Build the per-patch neighbour cache in two stages (leaf-leaf, then particle-particle).
 *
 * For every non-empty patch the following kernels are run:
 *  1. "compute neigh cache 1" (over leaves): count, for each leaf, the leaves reached by the
 *     tree walk under the box-overlap criterion (either box extended by its own
 *     `rint * Rkern` against the other one);
 *  2. "compute neigh cache 2" (over leaves): same walk, writes the ids of those leaves;
 *  3. "search particles parent leaf" (over objects): find, for each object, the leaf whose box
 *     contains its position;
 *  4. "compute neigh cache 1" (over objects): count the neighbours of each particle by scanning
 *     only the objects stored in the neighbouring leaves of its parent leaf;
 *  5. "compute neigh cache 2" (over objects): same scan, writes the neighbour ids.
 *
 * Pair test used in steps 4 and 5: `b` is rejected only when `r_ab^2` is strictly larger than
 * both `(h_a * htol * Rkern)^2` and `(h_b * htol * Rkern)^2`, with
 * `htol = solver_config.htol_up_coarse_cycle`.
 *
 * Node ids handed to the leaf callbacks are offset by the internal cell count; leaf-local
 * indices are obtained by subtracting `intnode_cnt`.
 *
 * `free_alloc()` is called on `storage.neigh_cache` before the new caches are added, and the
 * elapsed wall time is accumulated into `storage.timings_details.neighbors`.
 */
template<class Tvec, class Tmorton, template<class> class SPHKernel>
void shammodels::sph::modules::NeighbourCache<Tvec, Tmorton, SPHKernel>::
    start_neighbors_cache_2stages() {

    using RTree = shamtree::CompressedLeafBVH<Tmorton, Tvec, 3>;

    shambase::Timer time_neigh;
    time_neigh.start();

    StackEntry stack_loc{};

    // Builds and returns the neighbour cache of a single patch.
    auto build_neigh_cache = [&](u64 patch_id) {
        shamlog_debug_ln("BasicSPH", "build particle cache id =", patch_id);

        NamedStackEntry cache_build_stack_loc{"build cache"};

        auto &mfield = storage.merged_xyzh.get().get(patch_id);

        // Field 0 is read as positions, field 1 as smoothing lengths.
        sham::DeviceBuffer<Tvec> &buf_xyz    = mfield.template get_field_buf_ref<Tvec>(0);
        sham::DeviceBuffer<Tscal> &buf_hpart = mfield.template get_field_buf_ref<Tscal>(1);

        // Per tree node value, scaled by Rkern below to extend the node boxes.
        sham::DeviceBuffer<Tscal> &tree_field_rint
            = storage.rtree_rint_field.get().get(patch_id).buf_field;

        RTree &tree  = storage.merged_pos_trees.get().get(patch_id);
        auto obj_it  = tree.get_object_iterator();
        auto leaf_it = tree.get_traverser();

        u32 leaf_cnt    = tree.get_leaf_cell_count();
        u32 intnode_cnt = tree.get_internal_cell_count();

        u32 obj_cnt = shambase::get_check_ref(storage.part_counts).indexes.get(patch_id);

        using namespace shamrock;

        Tscal h_tolerance = solver_config.htol_up_coarse_cycle;

        NamedStackEntry stack_loc1{"init cache"};

        // ---- Stage 1a: count the neighbouring leaves of every leaf ----

        sham::DeviceBuffer<u32> neigh_count_leaf(
            leaf_cnt, shamsys::instance::get_compute_scheduler_ptr());

        shamsys::instance::get_compute_queue().wait_and_throw();

        shamlog_debug_sycl_ln("Cache", "generate cache for Nleaf=", leaf_cnt);

        {
            sham::DeviceQueue &q = shamsys::instance::get_compute_scheduler().get_queue();
            sham::EventList depends_list;

            // Only the tree data is read here: the particle buffers are not accessed by this
            // kernel, so they are not added to its dependencies.
            auto rint_tree   = tree_field_rint.get_read_access(depends_list);
            auto neigh_cnt   = neigh_count_leaf.get_write_access(depends_list);
            auto leaf_looper = leaf_it.get_read_access(depends_list);

            auto e = q.submit(depends_list, [&](sycl::handler &cgh) {
                u32 offset_leaf = intnode_cnt;

                shambase::parallel_for(cgh, leaf_cnt, "compute neigh cache 1", [=](u64 gid) {
                    u32 id_a = static_cast<u32>(gid);

                    Tscal leaf_a_rint    = rint_tree[offset_leaf + gid] * Kernel::Rkern;
                    Tvec leaf_a_bmin     = leaf_looper.aabb_min[offset_leaf + gid];
                    Tvec leaf_a_bmax     = leaf_looper.aabb_max[offset_leaf + gid];
                    Tvec leaf_a_bmin_ext = leaf_a_bmin - leaf_a_rint;
                    Tvec leaf_a_bmax_ext = leaf_a_bmax + leaf_a_rint;

                    u32 cnt = 0;

                    leaf_looper.rtree_for(
                        // Accept the node if either box, once extended, reaches the other one.
                        [&](u32 node_id, shammath::AABB<Tvec> node_aabb) -> bool {
                            Tscal int_r_max_cell = rint_tree[node_id] * Kernel::Rkern;

                            Tvec ext_bmin = node_aabb.lower - int_r_max_cell;
                            Tvec ext_bmax = node_aabb.upper + int_r_max_cell;

                            return BBAA::cella_neigh_b(leaf_a_bmin, leaf_a_bmax, ext_bmin, ext_bmax)
                                   || BBAA::cella_neigh_b(
                                       leaf_a_bmin_ext,
                                       leaf_a_bmax_ext,
                                       node_aabb.lower,
                                       node_aabb.upper);
                        },
                        [&](u32) {
                            cnt++;
                        });

                    neigh_cnt[id_a] = cnt;
                });
            });

            tree_field_rint.complete_event_state(e);
            neigh_count_leaf.complete_event_state(e);
            leaf_it.complete_event_state(e);
        }

        tree::ObjectCache pleaf_cache
            = tree::prepare_object_cache(std::move(neigh_count_leaf), leaf_cnt);

        // ---- Stage 1b: fill the ids of the neighbouring leaves ----

        NamedStackEntry stack_loc2{"fill cache"};

        {
            sham::DeviceQueue &q = shamsys::instance::get_compute_scheduler().get_queue();
            sham::EventList depends_list;

            auto rint_tree         = tree_field_rint.get_read_access(depends_list);
            auto scanned_neigh_cnt = pleaf_cache.scanned_cnt.get_read_access(depends_list);
            auto neigh             = pleaf_cache.index_neigh_map.get_write_access(depends_list);
            auto leaf_looper       = leaf_it.get_read_access(depends_list);

            auto e = q.submit(depends_list, [&](sycl::handler &cgh) {
                u32 offset_leaf = intnode_cnt;

                shambase::parallel_for(cgh, leaf_cnt, "compute neigh cache 2", [=](u64 gid) {
                    u32 id_a = static_cast<u32>(gid);

                    Tscal leaf_a_rint    = rint_tree[offset_leaf + gid] * Kernel::Rkern;
                    Tvec leaf_a_bmin     = leaf_looper.aabb_min[offset_leaf + gid];
                    Tvec leaf_a_bmax     = leaf_looper.aabb_max[offset_leaf + gid];
                    Tvec leaf_a_bmin_ext = leaf_a_bmin - leaf_a_rint;
                    Tvec leaf_a_bmax_ext = leaf_a_bmax + leaf_a_rint;

                    // Write cursor: first slot of leaf a in the index map.
                    u32 cnt = scanned_neigh_cnt[id_a];

                    leaf_looper.rtree_for(
                        // Same criterion as in the counting kernel.
                        [&](u32 node_id, shammath::AABB<Tvec> node_aabb) -> bool {
                            Tscal int_r_max_cell = rint_tree[node_id] * Kernel::Rkern;

                            Tvec ext_bmin = node_aabb.lower - int_r_max_cell;
                            Tvec ext_bmax = node_aabb.upper + int_r_max_cell;

                            return BBAA::cella_neigh_b(leaf_a_bmin, leaf_a_bmax, ext_bmin, ext_bmax)
                                   || BBAA::cella_neigh_b(
                                       leaf_a_bmin_ext,
                                       leaf_a_bmax_ext,
                                       node_aabb.lower,
                                       node_aabb.upper);
                        },
                        [&](u32 leaf_b) {
                            neigh[cnt] = leaf_b;
                            cnt++;
                        });
                });
            });

            tree_field_rint.complete_event_state(e);
            pleaf_cache.scanned_cnt.complete_event_state(e);
            pleaf_cache.index_neigh_map.complete_event_state(e);
            leaf_it.complete_event_state(e);
        }

        // ---- Stage 2a: find the leaf that contains each particle ----

        sycl::buffer<u32> leaf_part_id(obj_cnt);

        {
            sham::DeviceQueue &q = shamsys::instance::get_compute_scheduler().get_queue();
            sham::EventList depends_list;

            auto xyz         = buf_xyz.get_read_access(depends_list);
            auto leaf_looper = leaf_it.get_read_access(depends_list);

            auto e = q.submit(depends_list, [&](sycl::handler &cgh) {
                sycl::accessor found_id{leaf_part_id, cgh, sycl::write_only, sycl::no_init};
                u32 offset_leaf = intnode_cnt;

                shambase::parallel_for(cgh, obj_cnt, "search particles parent leaf", [=](u64 gid) {
                    u32 id_a = static_cast<u32>(gid);

                    Tvec r_a = xyz[id_a];

                    // Sentinel: if no leaf is found, later uses of this index go out of bounds
                    // on purpose so that the failure is not silent.
                    u32 found_id_ = i32_max;

                    leaf_looper.rtree_for(
                        [&](u32 node_id, shammath::AABB<Tvec> node_aabb) -> bool {
                            return BBAA::is_coord_in_range_incl_max(
                                r_a, node_aabb.lower, node_aabb.upper);
                        },
                        [&](u32 leaf_b) {
                            // Convert the node id into a leaf-local index.
                            found_id_ = leaf_b - offset_leaf;
                        });

                    SHAM_ASSERT(found_id_ < offset_leaf + 1);

                    found_id[id_a] = found_id_;
                });
            });

            buf_xyz.complete_event_state(e);
            leaf_it.complete_event_state(e);
        }

        // ---- Stage 2b: count the neighbours of every particle ----

        sham::DeviceBuffer<u32> neigh_count(
            obj_cnt, shamsys::instance::get_compute_scheduler_ptr());

        shamsys::instance::get_compute_queue().wait_and_throw();

        shamlog_debug_sycl_ln("Cache", "generate cache for N=", obj_cnt);

        {
            sham::DeviceQueue &q = shamsys::instance::get_compute_scheduler().get_queue();
            sham::EventList depends_list;

            auto xyz                   = buf_xyz.get_read_access(depends_list);
            auto hpart                 = buf_hpart.get_read_access(depends_list);
            auto acc_neigh_leaf_looper = pleaf_cache.get_read_access(depends_list);
            auto neigh_cnt             = neigh_count.get_write_access(depends_list);
            auto particle_looper       = obj_it.cell_iterator.get_read_access(depends_list);

            auto e = q.submit(depends_list, [&, h_tolerance](sycl::handler &cgh) {
                tree::ObjectCacheIterator neigh_leaf_looper(acc_neigh_leaf_looper);

                sycl::accessor leaf_owner{leaf_part_id, cgh, sycl::read_only};

                u32 offset_leaf = intnode_cnt;

                constexpr Tscal Rker2 = Kernel::Rkern * Kernel::Rkern;

                shambase::parallel_for(cgh, obj_cnt, "compute neigh cache 1", [=](u64 gid) {
                    u32 id_a = static_cast<u32>(gid);

                    Tscal rint_a = hpart[id_a] * h_tolerance;
                    Tvec xyz_a   = xyz[id_a];

                    // Squared interaction radius of a, invariant during the scan.
                    const Tscal rcut2_a = rint_a * rint_a * Rker2;

                    u32 cnt = 0;

                    u32 leaf_own_a = leaf_owner[id_a];

                    // Only the leaves cached as neighbours of a's parent leaf are scanned.
                    neigh_leaf_looper.for_each_object(leaf_own_a, [&](u32 leaf_b) {
                        SHAM_ASSERT(leaf_b >= offset_leaf);

                        particle_looper.for_each_in_leaf_cell(leaf_b - offset_leaf, [&](u32 id_b) {
                            Tvec dr      = xyz_a - xyz[id_b];
                            Tscal rab2   = sycl::dot(dr, dr);
                            Tscal rint_b = hpart[id_b] * h_tolerance;

                            // Kept as "strictly outside both radii" so that the behaviour for
                            // non-finite values is unchanged.
                            bool no_interact = rab2 > rcut2_a && rab2 > rint_b * rint_b * Rker2;

                            if (!no_interact) {
                                cnt++;
                            }
                        });
                    });

                    neigh_cnt[id_a] = cnt;
                });
            });

            buf_xyz.complete_event_state(e);
            buf_hpart.complete_event_state(e);
            pleaf_cache.complete_event_state(e);
            neigh_count.complete_event_state(e);
            obj_it.cell_iterator.complete_event_state(e);
        }

        tree::ObjectCache pcache = tree::prepare_object_cache(std::move(neigh_count), obj_cnt);

        // ---- Stage 2c: fill the neighbour ids of every particle ----

        NamedStackEntry stack_loc3{"fill cache"};

        {
            sham::DeviceQueue &q = shamsys::instance::get_compute_scheduler().get_queue();
            sham::EventList depends_list;

            auto xyz                   = buf_xyz.get_read_access(depends_list);
            auto hpart                 = buf_hpart.get_read_access(depends_list);
            auto acc_neigh_leaf_looper = pleaf_cache.get_read_access(depends_list);
            auto scanned_neigh_cnt     = pcache.scanned_cnt.get_read_access(depends_list);
            auto neigh                 = pcache.index_neigh_map.get_write_access(depends_list);
            auto particle_looper       = obj_it.cell_iterator.get_read_access(depends_list);

            auto e = q.submit(depends_list, [&, h_tolerance](sycl::handler &cgh) {
                tree::ObjectCacheIterator neigh_leaf_looper(acc_neigh_leaf_looper);

                sycl::accessor leaf_owner{leaf_part_id, cgh, sycl::read_only};

                u32 offset_leaf = intnode_cnt;

                constexpr Tscal Rker2 = Kernel::Rkern * Kernel::Rkern;

                shambase::parallel_for(cgh, obj_cnt, "compute neigh cache 2", [=](u64 gid) {
                    u32 id_a = static_cast<u32>(gid);

                    Tscal rint_a = hpart[id_a] * h_tolerance;
                    Tvec xyz_a   = xyz[id_a];

                    // Squared interaction radius of a, invariant during the scan.
                    const Tscal rcut2_a = rint_a * rint_a * Rker2;

                    // Write cursor: first slot of particle a in the index map.
                    u32 cnt = scanned_neigh_cnt[id_a];

                    u32 leaf_own_a = leaf_owner[id_a];

                    neigh_leaf_looper.for_each_object(leaf_own_a, [&](u32 leaf_b) {
                        SHAM_ASSERT(leaf_b >= offset_leaf);

                        particle_looper.for_each_in_leaf_cell(leaf_b - offset_leaf, [&](u32 id_b) {
                            Tvec dr      = xyz_a - xyz[id_b];
                            Tscal rab2   = sycl::dot(dr, dr);
                            Tscal rint_b = hpart[id_b] * h_tolerance;

                            bool no_interact = rab2 > rcut2_a && rab2 > rint_b * rint_b * Rker2;

                            if (!no_interact) {
                                neigh[cnt] = id_b;
                                cnt++;
                            }
                        });
                    });
                });
            });

            buf_xyz.complete_event_state(e);
            buf_hpart.complete_event_state(e);
            pleaf_cache.complete_event_state(e);
            pcache.scanned_cnt.complete_event_state(e);
            pcache.index_neigh_map.complete_event_state(e);
            obj_it.cell_iterator.complete_event_state(e);
        }

        return pcache;
    };

    shambase::get_check_ref(storage.neigh_cache).free_alloc();

    using namespace shamrock::patch;
    scheduler().for_each_patchdata_nonempty([&](Patch cur_p, PatchDataLayer &) {
        auto &ncache = shambase::get_check_ref(storage.neigh_cache);
        ncache.neigh_cache.add_obj(cur_p.id_patch, build_neigh_cache(cur_p.id_patch));
    });

    time_neigh.end();
    storage.timings_details.neighbors += time_neigh.elasped_sec();
}


// Explicit instantiations of NeighbourCache for f64_3 vectors and u32 Morton codes, one per
// SPH kernel template listed below. The member templates defined in this file are only
// emitted for these combinations.
// NOTE(review): the kernel names (M4 ... C6) are presumably made visible by this
// using-directive together with shammath/sphkernels.hpp; confirm before qualifying them.
using namespace shammath;

template class shammodels::sph::modules::NeighbourCache<f64_3, u32, M4>;

template class shammodels::sph::modules::NeighbourCache<f64_3, u32, M6>;

template class shammodels::sph::modules::NeighbourCache<f64_3, u32, M8>;


template class shammodels::sph::modules::NeighbourCache<f64_3, u32, C2>;

template class shammodels::sph::modules::NeighbourCache<f64_3, u32, C4>;

template class shammodels::sph::modules::NeighbourCache<f64_3, u32, C6>;

Constants.hpp

DeviceBuffer.hpp

shammodels::gsph::names::common::xyz
constexpr const char * xyz
Position field (3D coordinates)
Definition FieldNames.hpp:33

shammodels::gsph::names::common::hpart
constexpr const char * hpart
Smoothing length field.
Definition FieldNames.hpp:34

NeighbourCache.hpp

shamsys::instance::get_compute_queue
sycl::queue & get_compute_queue(u32 id=0)
Definition NodeInstance.cpp:370

TreeTraversal.hpp

aliases_int.hpp

u32
std::uint32_t u32
32 bit unsigned integer
Definition aliases_int.hpp:27

u64
std::uint64_t u64
64 bit unsigned integer
Definition aliases_int.hpp:26

assert.hpp
Shamrock assertion utility.

SHAM_ASSERT
#define SHAM_ASSERT(x)
Shorthand for SHAM_ASSERT_NAMED without a message.
Definition assert.hpp:67

sham::DeviceBuffer
A buffer allocated in USM (Unified Shared Memory)
Definition DeviceBuffer.hpp:106

sham::DeviceBuffer::complete_event_state
void complete_event_state(sycl::event e) const
Complete the event state of the buffer.
Definition DeviceBuffer.hpp:368

sham::DeviceBuffer::get_write_access
T * get_write_access(sham::EventList &depends_list, SourceLocation src_loc=SourceLocation{})
Get a read-write pointer to the buffer's data.
Definition DeviceBuffer.hpp:349

sham::DeviceBuffer::get_read_access
const T * get_read_access(sham::EventList &depends_list, SourceLocation src_loc=SourceLocation{}) const
Get a read-only pointer to the buffer's data.
Definition DeviceBuffer.hpp:331

sham::DeviceQueue
A SYCL queue associated with a device and a context.
Definition DeviceQueue.hpp:32

sham::DeviceQueue::submit
sycl::event submit(Fct &&fct)
Submits a kernel to the SYCL queue.
Definition DeviceQueue.hpp:101

sham::DeviceScheduler::get_queue
DeviceQueue & get_queue(u32 id=0)
Get a reference to a DeviceQueue.
Definition DeviceScheduler.cpp:57

sham::EventList
Class to manage a list of SYCL events.
Definition EventList.hpp:31

shambase::Timer
Class Timer measures the time elapsed since the timer was started.
Definition time.hpp:96

shambase::Timer::end
void end()
Stops the timer and stores the elapsed time in nanoseconds.
Definition time.hpp:111

shambase::Timer::elasped_sec
f64 elasped_sec() const
Converts the stored nanosecond time to a floating point representation in seconds.
Definition time.hpp:123

shambase::Timer::start
void start()
Starts the timer.
Definition time.hpp:106

shammodels::sph::modules::NeighbourCache
Definition NeighbourCache.hpp:28

shamrock::patch::PatchDataLayer
PatchDataLayer container class, the layout is described in patchdata_layout.
Definition PatchDataLayer.hpp:35

shamrock.tree::ObjectCacheIterator
Definition TreeTraversal.hpp:487

shamtree::CompressedLeafBVH
A Compressed Leaf Bounding Volume Hierarchy (CLBVH) for neighborhood queries.
Definition CompressedLeafBVH.hpp:46

geometry_utils.hpp

log.hpp

shambase::get_check_ref
T & get_check_ref(const std::unique_ptr< T > &ptr, SourceLocation loc=SourceLocation())
Takes a std::unique_ptr and returns a reference to the object it holds. It throws a std::runtime_error...
Definition memory.hpp:110

shammath
namespace for math utility
Definition AABB.hpp:26

shamrock
namespace for the main framework
Definition __init__.py:1

i32_max
constexpr i32 i32_max
i32 max value
Definition numeric_limits.hpp:66

memory.hpp

sphkernels.hpp
sph kernels

shambase::details::BasicStackEntry
Definition stacktrace.hpp:106

shambase::details::NamedBasicStackEntry
Definition stacktrace.hpp:170

shammath::AABB
Axis-Aligned bounding box.
Definition AABB.hpp:99

shammath::AABB::lower
T lower
Lower bound of the AABB.
Definition AABB.hpp:104

shammath::AABB::upper
T upper
Upper bound of the AABB.
Definition AABB.hpp:105

shamrock::patch::Patch
Patch object that contains generic patch information.
Definition Patch.hpp:33

shamrock::patch::Patch::id_patch
u64 id_patch
unique key that identifies the patch
Definition Patch.hpp:86

shamrock.tree::ObjectCache
Definition TreeTraversal.hpp:375