Shamrock/doxygen/AMRGridRefinementHandler_8cpp_source.html

// -------------------------------------------------------//

//

// SHAMROCK code for hydrodynamics

// Copyright (c) 2021-2026 Timothée David--Cléris <tim.shamrock@proton.me>

// SPDX-License-Identifier: CeCILL Free Software License Agreement v2.1

// Shamrock is licensed under the CeCILL 2.1 License, see LICENSE for more information

//

// -------------------------------------------------------//


#include "shammodels/ramses/modules/AMRGridRefinementHandler.hpp"

#include "shamalgs/details/algorithm/algorithm.hpp"

#include "shamcomm/logs.hpp"

#include "shammodels/ramses/modules/AMRSortBlocks.hpp"

#include <stdexcept>


/**
 * @brief Build, for every non-empty patch, the list of blocks to refine and the list of block
 * groups to merge.
 *
 * For each patch a `UserAcc` is constructed from `(depends_list, id_patch, patch, pdat, args...)`
 * and its `refine_criterion` is evaluated on the device for every block of the patch. The
 * derefine flags are then filtered: a flag is kept on block `i` only if the `split_count`
 * consecutive blocks starting at `i` all asked to be derefined and
 * `BlockCoord::are_mergeable` accepts them. Both flag arrays are finally stream-compacted and
 * stored in the output maps under the patch id.
 *
 * @tparam UserAcc accessor type providing `refine_criterion(...)` and `finalize(...)`
 * @tparam T       types of the extra arguments handed to the `UserAcc` constructor and finalize
 * @param dd_refine_list   output, per patch: compacted refine flags (used downstream as the
 *                         indexes of the blocks to split)
 * @param dd_derefine_list output, per patch: compacted merge flags (used downstream as the
 *                         index of the first block of each group to merge)
 * @param args             extra arguments passed (as lvalues) to `UserAcc`
 */
template<class Tvec, class TgridVec>
template<class UserAcc, class... T>
void shammodels::basegodunov::modules::AMRGridRefinementHandler<Tvec, TgridVec>::
    gen_refine_block_changes(
        shambase::DistributedData<sham::DeviceBuffer<u32>> &dd_refine_list,
        shambase::DistributedData<sham::DeviceBuffer<u32>> &dd_derefine_list,
        T &&...args) {

    using namespace shamrock::patch;

    u64 tot_refine   = 0;
    u64 tot_derefine = 0;

    sham::DeviceQueue &q = shamsys::instance::get_compute_scheduler().get_queue();
    auto dev_sched       = shamsys::instance::get_compute_scheduler_ptr();

    scheduler().for_each_patchdata_nonempty([&](Patch cur_p, PatchDataLayer &pdat) {
        u64 id_patch = cur_p.id_patch;

        // create the refine and derefine flags buffers (one flag per block)
        u32 obj_cnt = pdat.get_obj_cnt();

        sham::DeviceBuffer<u32> refine_flags(obj_cnt, dev_sched);
        sham::DeviceBuffer<u32> derefine_flags(obj_cnt, dev_sched);

        {
            sham::EventList depends_list;

            UserAcc uacc(depends_list, id_patch, cur_p, pdat, args...);

            auto refine_acc   = refine_flags.get_write_access(depends_list);
            auto derefine_acc = derefine_flags.get_write_access(depends_list);

            // fill in the flags using the user criterion
            auto e = q.submit(depends_list, [&](sycl::handler &cgh) {
                cgh.parallel_for(sycl::range<1>(obj_cnt), [=](sycl::item<1> gid) {
                    bool flag_refine   = false;
                    bool flag_derefine = false;
                    uacc.refine_criterion(gid.get_linear_id(), uacc, flag_refine, flag_derefine);

                    // Safeguard against the nonsensical case where both are requested:
                    // refinement wins
                    if (flag_refine && flag_derefine) {
                        flag_derefine = false;
                    }

                    refine_acc[gid]   = (flag_refine) ? 1 : 0;
                    derefine_acc[gid] = (flag_derefine) ? 1 : 0;
                });
            });

            sham::EventList resulting_events;
            resulting_events.add_event(e);

            refine_flags.complete_event_state(resulting_events);
            derefine_flags.complete_event_state(resulting_events);

            uacc.finalize(resulting_events, id_patch, cur_p, pdat, args...);
        }

        sham::DeviceBuffer<TgridVec> &buf_cell_min = pdat.get_field_buf_ref<TgridVec>(0);
        sham::DeviceBuffer<TgridVec> &buf_cell_max = pdat.get_field_buf_ref<TgridVec>(1);

        // The filtered merge flags go to their own buffer. Every work-item reads the derefine
        // flags of the split_count blocks starting at its own index, so writing the result back
        // into derefine_flags would let a work-item overwrite a flag that another work-item has
        // not read yet (data race that could cancel a valid merge).
        sham::DeviceBuffer<u32> merge_flags(obj_cnt, dev_sched);

        sham::EventList depends_list;
        auto acc_min        = buf_cell_min.get_read_access(depends_list);
        auto acc_max        = buf_cell_max.get_read_access(depends_list);
        auto acc_want_merge = derefine_flags.get_read_access(depends_list);
        auto acc_merge_flag = merge_flags.get_write_access(depends_list);

        // keep a merge flag only if the whole group of blocks wants to merge and can be merged
        auto e = q.submit(depends_list, [&](sycl::handler &cgh) {
            cgh.parallel_for(sycl::range<1>(obj_cnt), [=](sycl::item<1> gid) {
                u32 id = gid.get_linear_id();

                bool do_merge = false;

                // Only blocks having split_count - 1 successors in the buffer can start a
                // group, this also avoids the out-of-bound read at the end of the buffer
                if (id + split_count <= obj_cnt) {
                    std::array<BlockCoord, split_count> blocks;
                    bool all_want_to_merge = true;

                    for (u32 lid = 0; lid < split_count; lid++) {
                        blocks[lid]       = BlockCoord{acc_min[id + lid], acc_max[id + lid]};
                        all_want_to_merge = all_want_to_merge && acc_want_merge[id + lid];
                    }

                    do_merge = all_want_to_merge && BlockCoord::are_mergeable(blocks);
                }

                acc_merge_flag[id] = do_merge;
            });
        });

        buf_cell_min.complete_event_state(e);
        buf_cell_max.complete_event_state(e);
        derefine_flags.complete_event_state(e);
        merge_flags.complete_event_state(e);

        // refinement

        // perform stream compactions on the refinement flags
        auto buf_refine = shamalgs::numeric::stream_compact(dev_sched, refine_flags, obj_cnt);

        shamlog_debug_ln(
            "AMRGrid", "patch ", id_patch, "refine block count = ", buf_refine.get_size());

        tot_refine += buf_refine.get_size();

        // add the results to the map
        dd_refine_list.add_obj(id_patch, std::move(buf_refine));

        // derefinement

        // perform stream compactions on the filtered merge flags
        auto buf_derefine = shamalgs::numeric::stream_compact(dev_sched, merge_flags, obj_cnt);

        shamlog_debug_ln(
            "AMRGrid", "patch ", id_patch, "merge block count = ", buf_derefine.get_size());

        tot_derefine += buf_derefine.get_size();

        // add the results to the map
        dd_derefine_list.add_obj(id_patch, std::move(buf_derefine));
    });

    logger::info_ln("AMRGrid", "on this process", tot_refine, "blocks were refined");
    // each merge entry stands for a group of split_count blocks
    logger::info_ln(
        "AMRGrid", "on this process", tot_derefine * split_count, "blocks were derefined");
}

/**
 * @brief Split every block listed in `dd_refine_list` into `split_count` children.
 *
 * For each patch the patch data is expanded by `split_count - 1` blocks per refined block. The
 * first child reuses the slot of the parent, the other children are appended after the blocks
 * that existed before the expansion. The block bounds are rewritten on the device and
 * `UserAcc::apply_refine` is called to fill the fields of the children.
 *
 * @tparam UserAcc accessor type built from `(depends_list, pdat)` providing `apply_refine` and
 *                 `finalize(resulting_events, pdat)`
 * @param dd_refine_list per patch list of the indexes of the blocks to split
 * @return true if at least one patch had blocks to split
 *
 * NOTE(review): `dd_refine_list.get(id_patch)` is called for every patch visited by
 * `for_each_patch_data`; presumably an entry must exist for each of them — confirm against the
 * producer of the list.
 */
template<class Tvec, class TgridVec>
template<class UserAcc>
bool shammodels::basegodunov::modules::AMRGridRefinementHandler<Tvec, TgridVec>::
    internal_refine_grid(shambase::DistributedData<sham::DeviceBuffer<u32>> &&dd_refine_list) {

    using namespace shamrock::patch;

    u64 process_block_total = 0;
    bool any_block_split    = false;

    scheduler().for_each_patch_data([&](u64 id_patch, Patch cur_p, PatchDataLayer &pdat) {
        sham::DeviceQueue &q = shamsys::instance::get_compute_scheduler().get_queue();

        // block count before the expansion, the appended children start at this index
        u32 block_cnt_before = pdat.get_obj_cnt();

        sham::DeviceBuffer<u32> &to_split = dd_refine_list.get(id_patch);
        const bool patch_has_splits       = to_split.get_size() > 0;

        if (patch_has_splits) {

            // reserve room for the children that do not reuse the slot of their parent
            pdat.expand(to_split.get_size() * (split_count - 1));

            sham::DeviceBuffer<TgridVec> &buf_cell_min = pdat.get_field_buf_ref<TgridVec>(0);
            sham::DeviceBuffer<TgridVec> &buf_cell_max = pdat.get_field_buf_ref<TgridVec>(1);

            sham::EventList depends_list;
            auto coord_low  = buf_cell_min.get_write_access(depends_list);
            auto coord_high = buf_cell_max.get_write_access(depends_list);
            UserAcc uacc(depends_list, pdat);
            auto split_ids = to_split.get_read_access(depends_list);

            // one work-item per block to split: set the bounds of the children, then let the
            // user accessor fill their fields
            auto e = q.submit(depends_list, [&](sycl::handler &cgh) {
                u32 first_appended               = block_cnt_before;
                constexpr u32 appended_per_split = split_count - 1;

                cgh.parallel_for(sycl::range<1>(to_split.get_size()), [=](sycl::item<1> gid) {
                    u32 split_rank = gid.get_linear_id();
                    u32 parent_id  = split_ids[split_rank];

                    // bounds of the parent and of its children
                    BlockCoord parent{coord_low[parent_id], coord_high[parent_id]};

                    std::array<BlockCoord, split_count> children
                        = BlockCoord::get_split(parent.bmin, parent.bmax);

                    // child 0 takes the place of the parent, the others go in the appended area
                    std::array<u32, split_count> child_ids;
                    child_ids[0] = parent_id;

                    u32 append_base = first_appended + split_rank * appended_per_split;

#pragma unroll
                    for (u32 k = 1; k < split_count; k++) {
                        child_ids[k] = append_base + (k - 1);
                    }

                    // store the bounds of every child
#pragma unroll
                    for (u32 k = 0; k < split_count; k++) {
                        coord_low[child_ids[k]]  = children[k].bmin;
                        coord_high[child_ids[k]] = children[k].bmax;
                    }

                    // user code fills the fields of the children
                    uacc.apply_refine(parent_id, parent, child_ids, children, uacc);
                });
            });

            sham::EventList resulting_events{e};

            buf_cell_min.complete_event_state(resulting_events);
            buf_cell_max.complete_event_state(resulting_events);

            uacc.finalize(resulting_events, pdat);

            to_split.complete_event_state(resulting_events);
        }

        // counted after the expansion so the new blocks are included
        process_block_total += pdat.get_obj_cnt();
        any_block_split = any_block_split || patch_has_splits;
    });

    logger::info_ln("AMRGrid", "process block count =", process_block_total);

    return any_block_split;
}


/**
 * @brief Merge every group of `split_count` consecutive blocks listed in `dd_derefine_list`.
 *
 * Each entry of the list is the index of the first block of a group. On the device the bounds of
 * the group are merged with `BlockCoord::get_merge` and written in the slot of the first block,
 * the `split_count - 1` following blocks are flagged for removal and
 * `UserAcc::apply_derefine` fills the fields of the merged block. The patch data is then
 * remapped so that only the kept blocks remain.
 *
 * @tparam UserAcc accessor type built from `(depends_list, pdat)` providing `apply_derefine`
 *                 and `finalize(resulting_events, pdat)`
 * @param dd_derefine_list per patch list of the first index of each group to merge
 * @return true if at least one patch had groups to merge
 * @throws std::runtime_error if no block is left to keep after the merge of a patch
 */
template<class Tvec, class TgridVec>
template<class UserAcc>
bool shammodels::basegodunov::modules::AMRGridRefinementHandler<Tvec, TgridVec>::
    internal_derefine_grid(shambase::DistributedData<sham::DeviceBuffer<u32>> &&dd_derefine_list) {

    using namespace shamrock::patch;

    bool any_block_merged = false;

    sham::DeviceQueue &q = shamsys::instance::get_compute_scheduler().get_queue();
    auto dev_sched       = shamsys::instance::get_compute_scheduler_ptr();

    scheduler().for_each_patch_data([&](u64 id_patch, Patch cur_p, PatchDataLayer &pdat) {
        u32 block_cnt_before = pdat.get_obj_cnt();

        sham::DeviceBuffer<u32> &to_merge = dd_derefine_list.get(id_patch);

        // nothing to merge in this patch
        if (!(to_merge.get_size() > 0)) {
            return;
        }

        // every block is kept unless a merge flags it for removal
        sham::DeviceBuffer<u32> keep_block_flag(block_cnt_before, dev_sched);
        keep_block_flag.fill(1);

        sham::DeviceBuffer<TgridVec> &buf_cell_min = pdat.get_field_buf_ref<TgridVec>(0);
        sham::DeviceBuffer<TgridVec> &buf_cell_max = pdat.get_field_buf_ref<TgridVec>(1);

        sham::EventList depends_list;
        auto coord_low  = buf_cell_min.get_write_access(depends_list);
        auto coord_high = buf_cell_max.get_write_access(depends_list);
        UserAcc uacc(depends_list, pdat);
        auto merge_ids = to_merge.get_read_access(depends_list);
        auto keep_acc  = keep_block_flag.get_write_access(depends_list);

        // one work-item per group: merge the bounds, flag the removed blocks, fill the fields
        auto e = q.submit(depends_list, [&](sycl::handler &cgh) {
            cgh.parallel_for(sycl::range<1>(to_merge.get_size()), [=](sycl::item<1> gid) {
                u32 first_child = merge_ids[gid.get_linear_id()];

                // indexes and bounds of the blocks of the group
                std::array<u32, split_count> child_ids;
                std::array<BlockCoord, split_count> child_coords;

#pragma unroll
                for (u32 k = 0; k < split_count; k++) {
                    child_ids[k] = first_child + k;
                    child_coords[k]
                        = BlockCoord{coord_low[child_ids[k]], coord_high[child_ids[k]]};
                }

                // the merged block is stored in the slot of the first child
                BlockCoord merged = BlockCoord::get_merge(child_coords);

                coord_low[first_child]  = merged.bmin;
                coord_high[first_child] = merged.bmax;

                // all the other children are dropped by the compaction below
#pragma unroll
                for (u32 k = 1; k < split_count; k++) {
                    keep_acc[first_child + k] = 0;
                }

                // user code fills the fields of the merged block
                uacc.apply_derefine(child_ids, child_coords, first_child, merged, uacc);
            });
        });

        sham::EventList resulting_events{e};

        buf_cell_min.complete_event_state(resulting_events);
        buf_cell_max.complete_event_state(resulting_events);

        uacc.finalize(resulting_events, pdat);

        keep_block_flag.complete_event_state(resulting_events);
        to_merge.complete_event_state(resulting_events);

        // compact the keep flags into the list of surviving blocks
        auto buf_keep
            = shamalgs::numeric::stream_compact(dev_sched, keep_block_flag, block_cnt_before);

        shamlog_debug_ln(
            "AMR Grid",
            "patch",
            id_patch,
            "derefine block count ",
            block_cnt_before,
            "->",
            buf_keep.get_size());

        if (buf_keep.get_size() == 0) {
            throw std::runtime_error("buf keep must contain something at this point");
        }

        // drop the removed blocks from every field of the patch
        pdat.index_remap_resize(buf_keep, buf_keep.get_size());

        // reaching this point means the merge list of this patch was not empty
        any_block_merged = true;
    });

    return any_block_merged;
}


/**
 * @brief Run one refinement pass driven by user supplied accessors.
 *
 * The blocks are sorted, the refine and derefine lists are generated with `UserAccCrit`, then
 * the splits (`UserAccSplit`) and the merges (`UserAccMerge`) are applied in that order.
 *
 * @tparam UserAccCrit  accessor evaluating the refinement criterion
 * @tparam UserAccSplit accessor filling the fields of split blocks
 * @tparam UserAccMerge accessor filling the fields of merged blocks
 */
template<class Tvec, class TgridVec>
template<class UserAccCrit, class UserAccSplit, class UserAccMerge>
void shammodels::basegodunov::modules::AMRGridRefinementHandler<Tvec, TgridVec>::
    internal_update_refinement() {

    // The blocks have to be sorted before the refinement pass
    AMRSortBlocks sorter(context, solver_config, storage);
    sorter.reorder_amr_blocks();

    // Per patch lists of the blocks to split and of the groups to merge
    shambase::DistributedData<sham::DeviceBuffer<u32>> blocks_to_split;
    shambase::DistributedData<sham::DeviceBuffer<u32>> groups_to_merge;

    gen_refine_block_changes<UserAccCrit>(blocks_to_split, groups_to_merge);

    // The split only appends the new blocks at the end of the patch data
    internal_refine_grid<UserAccSplit>(std::move(blocks_to_split));

    // The merge is applied first and the old blocks are removed afterwards. The indexes of the
    // merge list remain valid after the split: internal_refine_grid applies no permutation and a
    // block cannot be both refined and derefined in the same pass.
    internal_derefine_grid<UserAccMerge>(std::move(groups_to_merge));
}


template<class Tvec, class TgridVec>

void shammodels::basegodunov::modules::AMRGridRefinementHandler<Tvec, TgridVec>::

    update_refinement() {


    /**
     * @brief Device-side accessor implementing the mass based refinement criterion.
     *
     * Holds read pointers on the block bounds (fields 0 and 1) and on the "rho" field of a
     * patch. The mass of a block is the sum of its cell densities multiplied by the cell volume:
     * a block is refined above `8 * wanted_mass` and flagged for derefinement below
     * `wanted_mass`.
     */
    class RefineCritBlock {
        public:
        const TgridVec *block_low_bound;
        const TgridVec *block_high_bound;
        const Tscal *block_density_field;

        /// inverse of the number of cells along one side of a block
        Tscal one_over_Nside = 1. / AMRBlock::Nside;

        /// factor converting integer grid coordinates to positions
        Tscal dxfact;
        /// reference mass of the criterion
        Tscal wanted_mass;

        /**
         * @brief Acquire read access to the bounds and density buffers of `pdat`.
         *
         * @param depends_list list receiving the events the kernel must wait on
         * @param id_patch     unused, part of the accessor interface
         * @param p            unused, part of the accessor interface
         * @param pdat         patch data holding the fields
         * @param dxfact       grid coordinate to position factor
         * @param wanted_mass  reference mass of the criterion
         */
        RefineCritBlock(
            sham::EventList &depends_list,
            u64 id_patch,
            shamrock::patch::Patch p,
            shamrock::patch::PatchDataLayer &pdat,
            Tscal dxfact,
            Tscal wanted_mass)
            : dxfact(dxfact), wanted_mass(wanted_mass) {

            block_low_bound  = pdat.get_field<TgridVec>(0).get_buf().get_read_access(depends_list);
            block_high_bound = pdat.get_field<TgridVec>(1).get_buf().get_read_access(depends_list);
            block_density_field = pdat.get_field<Tscal>(pdat.pdl().get_field_idx<Tscal>("rho"))
                                      .get_buf()
                                      .get_read_access(depends_list);
        }

        /**
         * @brief Register `resulting_events` on the buffers acquired by the constructor.
         *
         * The buffers are fetched with `TgridVec`, the same type used by the constructor, so
         * that both sides stay consistent for any grid vector type.
         */
        void finalize(
            sham::EventList &resulting_events,
            u64 id_patch,
            shamrock::patch::Patch p,
            shamrock::patch::PatchDataLayer &pdat,
            Tscal dxfact,
            Tscal wanted_mass) {

            sham::DeviceBuffer<TgridVec> &buf_cell_low_bound
                = pdat.get_field<TgridVec>(0).get_buf();
            sham::DeviceBuffer<TgridVec> &buf_cell_high_bound
                = pdat.get_field<TgridVec>(1).get_buf();

            buf_cell_low_bound.complete_event_state(resulting_events);
            buf_cell_high_bound.complete_event_state(resulting_events);
            pdat.get_field<Tscal>(pdat.pdl().get_field_idx<Tscal>("rho"))
                .get_buf()
                .complete_event_state(resulting_events);
        }

        /**
         * @brief Evaluate the criterion for one block.
         *
         * @param block_id        index of the block in the patch
         * @param acc             copy of the accessor used to read the buffers
         * @param should_refine   set to true if the block must be split
         * @param should_derefine set to true if the block may be merged
         */
        void refine_criterion(
            u32 block_id, RefineCritBlock acc, bool &should_refine, bool &should_derefine) const {

            TgridVec low_bound  = acc.block_low_bound[block_id];
            TgridVec high_bound = acc.block_high_bound[block_id];

            Tvec lower_flt = low_bound.template convert<Tscal>() * dxfact;
            Tvec upper_flt = high_bound.template convert<Tscal>() * dxfact;

            Tvec block_cell_size = (upper_flt - lower_flt) * one_over_Nside;

            // mass of the block: sum of the cell densities times the volume of a cell
            Tscal sum_mass = 0;
            for (u32 i = 0; i < AMRBlock::block_size; i++) {
                sum_mass += acc.block_density_field[i + block_id * AMRBlock::block_size];
            }
            sum_mass *= block_cell_size.x() * block_cell_size.y() * block_cell_size.z();

            // refinement takes precedence, derefinement is only considered otherwise
            should_refine   = sum_mass > wanted_mass * 8;
            should_derefine = !should_refine && (sum_mass < wanted_mass);

            // a block can only be split while it spans more than Nside grid units on every axis
            should_refine = should_refine && (high_bound.x() - low_bound.x() > AMRBlock::Nside)
                            && (high_bound.y() - low_bound.y() > AMRBlock::Nside)
                            && (high_bound.z() - low_bound.z() > AMRBlock::Nside);
        }
    };


    /**
     * @brief Device-side accessor filling the fields of blocks that are split or merged.
     *
     * Holds write pointers on fields 2, 3 and 4 of the patch data, named here rho, rho_vel and
     * rhoE.
     *
     * NOTE(review): the field indexes and the f64 / f64_3 types are hard-coded, presumably
     * matching the layout used with the f64_3 instantiation — confirm against the layout setup.
     */
    class RefineCellAccessor {
        public:
        f64 *rho;
        f64_3 *rho_vel;
        f64 *rhoE;

        /// Acquire write access to the three fields, adding the dependencies to `depends_list`.
        RefineCellAccessor(sham::EventList &depends_list, shamrock::patch::PatchDataLayer &pdat) {

            rho     = pdat.get_field<f64>(2).get_buf().get_write_access(depends_list);
            rho_vel = pdat.get_field<f64_3>(3).get_buf().get_write_access(depends_list);
            rhoE    = pdat.get_field<f64>(4).get_buf().get_write_access(depends_list);
        }

        /// Register `resulting_events` on the three buffers acquired by the constructor.
        void finalize(sham::EventList &resulting_events, shamrock::patch::PatchDataLayer &pdat) {
            pdat.get_field<f64>(2).get_buf().complete_event_state(resulting_events);
            pdat.get_field<f64_3>(3).get_buf().complete_event_state(resulting_events);
            pdat.get_field<f64>(4).get_buf().complete_event_state(resulting_events);
        }

        /**
         * @brief Fill the cells of the eight children of a split block.
         *
         * Every cell of the parent is copied, unchanged, into the eight cells of the children
         * located at twice its coordinates plus a 0/1 offset on each axis.
         *
         * @param cur_idx          index of the parent block (its slot is reused by a child)
         * @param cur_coords       bounds of the parent block (unused here)
         * @param new_blocks       indexes of the eight children
         * @param new_block_coords bounds of the eight children (unused here)
         * @param acc              copy of the accessor used to reach the fields
         */
        void apply_refine(
            u32 cur_idx,
            BlockCoord cur_coords,
            std::array<u32, 8> new_blocks,
            std::array<BlockCoord, 8> new_block_coords,
            RefineCellAccessor acc) const {

            // Decode an index in [0, 8) into coordinates on a 2x2x2 grid, x varying fastest.
            // NOTE(review): only the dim == 3 case returns a value.
            auto get_coord_ref = [](u32 i) -> std::array<u32, dim> {
                constexpr u32 NsideBlockPow = 1;
                constexpr u32 Nside         = 1U << NsideBlockPow;

                if constexpr (dim == 3) {
                    const u32 tmp = i >> NsideBlockPow;
                    return {i % Nside, (tmp) % Nside, (tmp) >> NsideBlockPow};
                }
            };

            // Inverse of get_coord_ref: coordinates on the 2x2x2 grid to an index in [0, 8).
            // NOTE(review): assumes the children in new_blocks follow this x-fastest ordering,
            // confirm against BlockCoord::get_split.
            auto get_index_block = [](std::array<u32, dim> coord) -> u32 {
                constexpr u32 NsideBlockPow = 1;
                constexpr u32 Nside         = 1U << NsideBlockPow;

                if constexpr (dim == 3) {
                    return coord[0] + Nside * coord[1] + Nside * Nside * coord[2];
                }
            };

            // Map coordinates on the refined grid covering the parent to the index of the cell
            // to write: the high bits select the child block, the remainder the cell inside it
            auto get_gid_write = [&](std::array<u32, dim> &glid) -> u32 {
                std::array<u32, dim> bid
                    = {glid[0] >> AMRBlock::NsideBlockPow,
                       glid[1] >> AMRBlock::NsideBlockPow,
                       glid[2] >> AMRBlock::NsideBlockPow};

                return new_blocks[get_index_block(bid)] * AMRBlock::block_size
                       + AMRBlock::get_index(
                           {glid[0] % AMRBlock::Nside,
                            glid[1] % AMRBlock::Nside,
                            glid[2] % AMRBlock::Nside});
            };

            std::array<f64, AMRBlock::block_size> old_rho_block;
            std::array<f64_3, AMRBlock::block_size> old_rho_vel_block;
            std::array<f64, AMRBlock::block_size> old_rhoE_block;

            // save the parent block first: its slot is overwritten by one of the children
            for (u32 loc_id = 0; loc_id < AMRBlock::block_size; loc_id++) {
                u32 old_cell_idx          = cur_idx * AMRBlock::block_size + loc_id;
                old_rho_block[loc_id]     = acc.rho[old_cell_idx];
                old_rho_vel_block[loc_id] = acc.rho_vel[old_cell_idx];
                old_rhoE_block[loc_id]    = acc.rhoE[old_cell_idx];
            }

            // copy every parent cell into the eight child cells that cover it
            for (u32 loc_id = 0; loc_id < AMRBlock::block_size; loc_id++) {

                auto [lx, ly, lz] = get_coord_ref(loc_id);

                Tscal rho_block    = old_rho_block[loc_id];
                Tvec rho_vel_block = old_rho_vel_block[loc_id];
                Tscal rhoE_block   = old_rhoE_block[loc_id];

                for (u32 subdiv_lid = 0; subdiv_lid < 8; subdiv_lid++) {

                    auto [sx, sy, sz] = get_coord_ref(subdiv_lid);

                    std::array<u32, 3> glid = {lx * 2 + sx, ly * 2 + sy, lz * 2 + sz};

                    u32 new_cell_idx = get_gid_write(glid);

                    acc.rho[new_cell_idx]     = rho_block;
                    acc.rho_vel[new_cell_idx] = rho_vel_block;
                    acc.rhoE[new_cell_idx]    = rhoE_block;
                }
            }
        }

        /**
         * @brief Fill the cells of a block resulting from the merge of eight blocks.
         *
         * Each cell of the merged block receives the mean, over the eight old blocks, of the
         * cell having the same local index.
         *
         * NOTE(review): this averages the same local cell across the eight children rather than
         * the eight child cells that `apply_refine` writes from one parent cell — confirm that
         * this is the intended restriction operator.
         *
         * @param old_blocks indexes of the eight blocks being merged
         * @param old_coords bounds of the eight blocks being merged (unused here)
         * @param new_cell   index of the block receiving the merged values
         * @param new_coord  bounds of the merged block (unused here)
         * @param acc        copy of the accessor used to reach the fields
         */
        void apply_derefine(
            std::array<u32, 8> old_blocks,
            std::array<BlockCoord, 8> old_coords,
            u32 new_cell,
            BlockCoord new_coord,

            RefineCellAccessor acc) const {

            std::array<f64, AMRBlock::block_size> rho_block;
            std::array<f64_3, AMRBlock::block_size> rho_vel_block;
            std::array<f64, AMRBlock::block_size> rhoE_block;

            for (u32 cell_id = 0; cell_id < AMRBlock::block_size; cell_id++) {
                rho_block[cell_id]     = {};
                rho_vel_block[cell_id] = {};
                rhoE_block[cell_id]    = {};
            }

            // accumulate in local storage first: the destination block is read here as well
            for (u32 pid = 0; pid < 8; pid++) {
                for (u32 cell_id = 0; cell_id < AMRBlock::block_size; cell_id++) {
                    rho_block[cell_id] += acc.rho[old_blocks[pid] * AMRBlock::block_size + cell_id];
                    rho_vel_block[cell_id]
                        += acc.rho_vel[old_blocks[pid] * AMRBlock::block_size + cell_id];
                    rhoE_block[cell_id]
                        += acc.rhoE[old_blocks[pid] * AMRBlock::block_size + cell_id];
                }
            }

            for (u32 cell_id = 0; cell_id < AMRBlock::block_size; cell_id++) {
                rho_block[cell_id] /= 8;
                rho_vel_block[cell_id] /= 8;
                rhoE_block[cell_id] /= 8;
            }

            for (u32 cell_id = 0; cell_id < AMRBlock::block_size; cell_id++) {
                u32 newcell_idx          = new_cell * AMRBlock::block_size + cell_id;
                acc.rho[newcell_idx]     = rho_block[cell_id];
                acc.rho_vel[newcell_idx] = rho_vel_block[cell_id];
                acc.rhoE[newcell_idx]    = rhoE_block[cell_id];
            }
        }
    };


    using AMRmode_None         = typename AMRMode<Tvec, TgridVec>::None;
    using AMRmode_DensityBased = typename AMRMode<Tvec, TgridVec>::DensityBased;

    // becomes true as soon as a block was split or merged during this pass
    bool has_cell_order_changed = false;

    if (std::get_if<AMRmode_None>(&solver_config.amr_mode.config)) {
        // AMR is disabled: the grid is left untouched
    } else if (
        AMRmode_DensityBased *density_cfg
        = std::get_if<AMRmode_DensityBased>(&solver_config.amr_mode.config)) {

        Tscal coord_to_pos(solver_config.grid_coord_to_pos_fact);

        // per patch lists of the blocks to split and of the groups of blocks to merge
        shambase::DistributedData<sham::DeviceBuffer<u32>> blocks_to_split;
        shambase::DistributedData<sham::DeviceBuffer<u32>> groups_to_merge;

        gen_refine_block_changes<RefineCritBlock>(
            blocks_to_split, groups_to_merge, coord_to_pos, density_cfg->crit_mass);

        // The split only appends the new blocks at the end of the patch data
        bool did_split = internal_refine_grid<RefineCellAccessor>(std::move(blocks_to_split));

        // The merge is applied first and the old blocks are removed afterwards. The indexes of
        // the merge list remain valid after the split: internal_refine_grid applies no
        // permutation and a block cannot be both refined and derefined in the same pass.
        bool did_merge = internal_derefine_grid<RefineCellAccessor>(std::move(groups_to_merge));

        has_cell_order_changed = did_split || did_merge;
    }

    if (has_cell_order_changed) {
        // The grid was modified: restore the block ordering
        AMRSortBlocks sorter(context, solver_config, storage);
        sorter.reorder_amr_blocks();
    }

}


// Explicit instantiation of the handler with Tvec = f64_3 and TgridVec = i64_3, so that the
// member templates defined in this file are compiled for that combination.
template class shammodels::basegodunov::modules::AMRGridRefinementHandler<f64_3, i64_3>;

AMRGridRefinementHandler.hpp

AMRSortBlocks.hpp

f64
double f64
Alias for double.
Definition aliases_float.hpp:20

u32
std::uint32_t u32
32 bit unsigned integer
Definition aliases_int.hpp:27

u64
std::uint64_t u64
64 bit unsigned integer
Definition aliases_int.hpp:26

sham::DeviceBuffer
A buffer allocated in USM (Unified Shared Memory)
Definition DeviceBuffer.hpp:106

sham::DeviceBuffer::complete_event_state
void complete_event_state(sycl::event e) const
Complete the event state of the buffer.
Definition DeviceBuffer.hpp:368

sham::DeviceBuffer::get_write_access
T * get_write_access(sham::EventList &depends_list, SourceLocation src_loc=SourceLocation{})
Get a read-write pointer to the buffer's data.
Definition DeviceBuffer.hpp:349

sham::DeviceBuffer::get_size
size_t get_size() const
Gets the number of elements in the buffer.
Definition DeviceBuffer.hpp:476

sham::DeviceBuffer::get_read_access
const T * get_read_access(sham::EventList &depends_list, SourceLocation src_loc=SourceLocation{}) const
Get a read-only pointer to the buffer's data.
Definition DeviceBuffer.hpp:331

sham::DeviceQueue
A SYCL queue associated with a device and a context.
Definition DeviceQueue.hpp:32

sham::DeviceQueue::submit
sycl::event submit(Fct &&fct)
Submits a kernel to the SYCL queue.
Definition DeviceQueue.hpp:101

sham::DeviceScheduler::get_queue
DeviceQueue & get_queue(u32 id=0)
Get a reference to a DeviceQueue.
Definition DeviceScheduler.cpp:57

sham::EventList
Class to manage a list of SYCL events.
Definition EventList.hpp:31

sham::EventList::add_event
void add_event(sycl::event e)
Add an event to the list of events.
Definition EventList.hpp:87

shambase::DistributedData
Represents a collection of objects distributed across patches identified by a u64 id.
Definition DistributedData.hpp:43

shammodels::basegodunov::modules::AMRGridRefinementHandler
Definition AMRGridRefinementHandler.hpp:28

shamrock::patch::PatchDataLayerLayout::get_field_idx
u32 get_field_idx(const std::string &field_name) const
Get the field id if matching name & type.
Definition PatchDataLayerLayout.hpp:349

shamrock::patch::PatchDataLayer
PatchDataLayer container class, the layout is described in patchdata_layout.
Definition PatchDataLayer.hpp:35

shamrock::patch::PatchDataLayer::index_remap_resize
void index_remap_resize(sycl::buffer< u32 > &index_map, u32 len)
This function remaps the patchdatafield like so: val[id] = val[index_map[id]]. This function can be use...
Definition PatchDataLayer.cpp:187

algorithm.hpp
main include file for the shamalgs algorithms

shamalgs::numeric::stream_compact
std::tuple< std::optional< sycl::buffer< u32 > >, u32 > stream_compact(sycl::queue &q, sycl::buffer< u32 > &buf_flags, u32 len)
Stream compaction algorithm.
Definition numeric.cpp:84

shamcmdopt::args
std::vector< std::string_view > args
Executable argument list (mapped from argv)
Definition cmdopt.cpp:63

logs.hpp

shamrock::patch::Patch
Patch object that contain generic patch information.
Definition Patch.hpp:33

shamrock::patch::Patch::id_patch
u64 id_patch
unique key that identify the patch
Definition Patch.hpp:86