From 8b3ade73997e9f87f1232b9dc9af35969e6f50dd Mon Sep 17 00:00:00 2001 From: "Claudius \"keldu\" Holeksa" Date: Mon, 19 Jan 2026 13:35:25 +0100 Subject: Rewriting parts to handle different ghost layers --- examples/cavity_2d_gpu/cavity_2d_gpu.cpp | 2 +- examples/heterogeneous_computing/SConscript | 2 +- .../heterogeneous_computing.cpp | 36 ------- examples/heterogeneous_computing/sim.cpp | 96 +++++++++++++++++ examples/poiseulle_particles_2d_gpu/sim.cpp | 11 +- lib/core/c++/chunk.hpp | 38 +++++++ lib/core/c++/common.hpp | 11 ++ lib/core/c++/descriptor.hpp | 4 + lib/core/c++/lbm.hpp | 3 - lib/sycl/.nix/derivation.nix | 4 +- lib/sycl/c++/common.hpp | 12 +++ lib/sycl/c++/data.hpp | 117 +++++++++++++++++++++ lib/sycl/c++/sycl.hpp | 4 + 13 files changed, 295 insertions(+), 45 deletions(-) delete mode 100644 examples/heterogeneous_computing/heterogeneous_computing.cpp create mode 100644 examples/heterogeneous_computing/sim.cpp create mode 100644 lib/core/c++/chunk.hpp create mode 100644 lib/core/c++/common.hpp create mode 100644 lib/sycl/c++/common.hpp create mode 100644 lib/sycl/c++/data.hpp create mode 100644 lib/sycl/c++/sycl.hpp diff --git a/examples/cavity_2d_gpu/cavity_2d_gpu.cpp b/examples/cavity_2d_gpu/cavity_2d_gpu.cpp index 507c2d6..0fc490a 100644 --- a/examples/cavity_2d_gpu/cavity_2d_gpu.cpp +++ b/examples/cavity_2d_gpu/cavity_2d_gpu.cpp @@ -319,7 +319,7 @@ int main(){ auto& lbm_dir = eo_lbm_dir.get_value(); auto out_dir = lbm_dir / "cavity_gpu_2d"; - acpp::sycl::queue sycl_q{acpp::sycl::default_selector_v, acpp::sycl::property::queue::in_order{}}; + sycl::queue sycl_q{sycl::default_selector_v, sycl::property::queue::in_order{}}; constexpr size_t num_cells = dim_x * dim_y; diff --git a/examples/heterogeneous_computing/SConscript b/examples/heterogeneous_computing/SConscript index 1e52d88..226185b 100644 --- a/examples/heterogeneous_computing/SConscript +++ b/examples/heterogeneous_computing/SConscript @@ -22,7 +22,7 @@ env.headers += examples_env.headers; # Cavity2D examples_objects = []; -examples_env.add_source_files(examples_objects, ['heterogeneous_computing.cpp'], shared=False); +examples_env.add_source_files(examples_objects, ['sim.cpp'], shared=False); examples_env.heterogeneous_computing = examples_env.Program('#bin/heterogeneous_computing', [examples_objects]); # Set Alias diff --git a/examples/heterogeneous_computing/heterogeneous_computing.cpp b/examples/heterogeneous_computing/heterogeneous_computing.cpp deleted file mode 100644 index 8a79354..0000000 --- a/examples/heterogeneous_computing/heterogeneous_computing.cpp +++ /dev/null @@ -1,36 +0,0 @@ -#include -#include - - -namespace kel { -namespace lbm { -namespace sch { -using namespace saw::schema; -using KelConfig = Struct< - Member ->; -} -} - -saw::error_or lbm_main(int argc, char** argv){ - return saw::make_void(); -} -} - -int main(int argc, char** argv){ - auto eov = kel::lbm_main(argc, argv); - if(eov.is_error()){ - auto& err = eov.get_error(); - auto err_msg = err.get_message(); - std::cerr<<"[Error]: "< +#include + +#include + +namespace kel { +namespace lbm { +namespace sch { +using namespace saw::schema; + +/** + * struct lbm_data { + * std::array, 64u*64u> dfs; + * std::array info; + * }; + * + * which leads to the form + * + * template + * struct lbm_data { + * std::array, Size*Size> dfs; + * std::array info; + * }; + * + * which transferred into sycl requires us to go to + * + * template + * struct lbm_sycl_data { + * std::array* dfs; + * uint8_t* info; + * }; + * + * in data form on host + * + * template + * using LbmData = Struct< + * Member, Size*Size>, "dfs">, + * Member, "info"> + * >; + * + * If we specialize the encode::Sycl data type, then we get + * With a helper class we can copy single values back and forth and the whole block is guaranteed + * to be allocated. And this one can be dynamic while the host definition might be compile time. + * + * template<...> + * class data,encode::Sycl> final { + * saw::data> meta; + * saw::data>* dfs; + * saw::data* info; + * }; + */ + +template +using CellStruct = Struct< + Member,Desc::D, "dfs">, + Member, "dfs_old">, + Member +>; + +} +template +saw::error_or simulate(int argc, char** argv, + const saw::data>& meta +{ + constexpr auto cell_size = sizeof(saw::data>); + + auto lbm_data = saw::heap,Desc::D, 64u>>>{meta}; + + return saw::make_void(); +} + +} + +saw::error_or lbm_main(int argc, char** argv){ + using namespace lbm; + return simulate(argc, argv); +} +} + +int main(int argc, char** argv){ + auto eov = kel::lbm_main(argc, argv); + if(eov.is_error()){ + auto& err = eov.get_error(); + auto err_msg = err.get_message(); + std::cerr<<"[Error]: "< kel_main(int argc, char** argv){ uint64_t x_d = 256u; uint64_t y_d = 64u; saw::data> meta{{x_d,y_d}}; + saw::data,Desc::D>> lbm_data{meta}; acpp::sycl::queue sycl_q; - sycl_q.wait(); + { + auto eov = setup_initial_conditions(lbm_data); + if(eov.is_error()){ + return eov; + } + } + + return saw::make_void(); } @@ -71,4 +79,3 @@ int main(int argc, char** argv){ } return 0; } -} diff --git a/lib/core/c++/chunk.hpp b/lib/core/c++/chunk.hpp new file mode 100644 index 0000000..bfef358 --- /dev/null +++ b/lib/core/c++/chunk.hpp @@ -0,0 +1,38 @@ +#pragma once + +#include "common.hpp" + +namespace kel { +namespace lbm { +namespace sch { +namespace impl { +template +struct chunk_schema_type_helper { + using Schema = typename chunk_schema_type_helper::Schema; +}; + +template +struct chunk_schema_type_helper { + using Schema = FixedArray; +}; +} + + +template +struct Chunk { + using InnerSchema = typename impl::chunk_schema_type_helper::Schema; +}; + +template +using SuperChunk = Array; +} +} +} + +namespace saw { +template +class data,Encode> final { +private: +public: +}; +} diff --git a/lib/core/c++/common.hpp b/lib/core/c++/common.hpp new file mode 100644 index 0000000..5f7129f --- /dev/null +++ b/lib/core/c++/common.hpp @@ -0,0 +1,11 @@ +#pragma once + +#include + +namespace kel { +namespace lbm { +namespace sch { +using namespace saw::schema; +} +} +} diff --git a/lib/core/c++/descriptor.hpp b/lib/core/c++/descriptor.hpp index c6938e3..9cc2591 100644 --- a/lib/core/c++/descriptor.hpp +++ b/lib/core/c++/descriptor.hpp @@ -15,6 +15,10 @@ struct Descriptor { static constexpr uint64_t Q = QV; }; +using D2Q9 = Descriptor<2u,9u>; +//using D2Q5 = Descriptor<2u,5u>; +using D3Q27 = Descriptor<3u,27u>; + template struct Cell { using Descriptor = Desc; diff --git a/lib/core/c++/lbm.hpp b/lib/core/c++/lbm.hpp index 473ca69..aff38e9 100644 --- a/lib/core/c++/lbm.hpp +++ b/lib/core/c++/lbm.hpp @@ -19,9 +19,6 @@ #include namespace kel { -namespace sch { -using namespace saw::schema; -} namespace lbm { template void print_lbm_meta(const converter& conv, const saw::data>& kin_vis_si){ diff --git a/lib/sycl/.nix/derivation.nix b/lib/sycl/.nix/derivation.nix index 68fbab7..02032ba 100644 --- a/lib/sycl/.nix/derivation.nix +++ b/lib/sycl/.nix/derivation.nix @@ -5,7 +5,7 @@ , pname , version , forstio -, kel-lbm +, kel , adaptive-cpp }: @@ -27,7 +27,7 @@ stdenv.mkDerivation { forstio.codec-json forstio.remote forstio.remote-sycl - kel-lbm.core + kel.lbm.core adaptive-cpp ]; diff --git a/lib/sycl/c++/common.hpp b/lib/sycl/c++/common.hpp new file mode 100644 index 0000000..8ff76fc --- /dev/null +++ b/lib/sycl/c++/common.hpp @@ -0,0 +1,12 @@ +#pragma once + +#include +#include + +namespace kel { +namespace lbm { +namespace sycl { +using namespace acpp::sycl; +} +} +} diff --git a/lib/sycl/c++/data.hpp b/lib/sycl/c++/data.hpp new file mode 100644 index 0000000..67422e2 --- /dev/null +++ b/lib/sycl/c++/data.hpp @@ -0,0 +1,117 @@ +#pragma once + +#include "common.hpp" + +namespace kel { +namespace lbm { +namespace encode { +template +struct Sycl { +}; +} + +namespace impl { +template +struct struct_has_only_equal_dimension_array +} +} +} + +namespace saw { +template +class data, Keys>...>, kel::lbm::encode::Sycl> final { +public: + static constexpr data*...>; +private: + + /** + * @todo Check by static assert that the members all have the same dimensions. Alternatively + * Do it here by specializing. + */ + StorageT members_; + kel::lbm::sycl::queue* q_; +public: + data(): + members_{}, + q_{nullptr} + {} + + ~data(){ + SAW_ASSERT(q_){ + exit(-1); + } + std::visit([this](auto arg){ + if(not arg){ + return; + } + sycl::free(arg,*q_); + arg = nullptr; + },members_); + } + + template + auto* get_ptr(){ + return std::get::value(members_); + } + + template + auto& get(){ + auto ptr = get_ptr(); + SAW_ASSERT(ptr); + return *ptr; + } + + void set_queue(kel::lbm::sycl::queue& q){ + q_ = &q; + } +}; + +} + +namespace kel { +namespace lbm { +namespace impl { +template +struct sycl_malloc_struct_helper; + +template +struct sycl_malloc_struct_helper, Encode> final { + template + static saw::error_or allocate_on_device_member(typename data>::StorageT& storage, sycl::queue& q){ + if constexpr (i < sizeof...(Members)){ + auto& ptr = std::get(storage); + + return allocate_on_device_member(sycl_data,q); + } + + return saw::make_void(); + } + + static saw::error_or allocate_on_device(data>& sycl_data, sycl::queue& q){ + typename data>::StorageT storage; + return allocate_on_device_member<0u>(storage,q); + } +}; +} +class device final { +private: + sycl::queue q_; + + SAW_FORBID_COPY(device); + SAW_FORBID_MOVE(device); +public: + device() = default; + ~device() = default; + + template + saw::error_or allocate_on_device(data>& sycl_data){ + auto eov = sycl_malloc_struct_helper::allocate_on_device(sycl_data, q_); + if(eov.is_error()){ + return eov; + } + sycl_data.set_queue(q_); + } +}; +} +} diff --git a/lib/sycl/c++/sycl.hpp b/lib/sycl/c++/sycl.hpp new file mode 100644 index 0000000..8ddc3cd --- /dev/null +++ b/lib/sycl/c++/sycl.hpp @@ -0,0 +1,4 @@ +#pragma once + +#include "common.hpp" +#include "data.hpp" -- cgit v1.2.3