From bd5adb919fe2ea5bef5fb775887ec107e5b23778 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Jean-No=C3=ABl=20Grad?= <jgrad@icp.uni-stuttgart.de>
Date: Mon, 11 Nov 2024 19:16:05 +0100
Subject: [PATCH] Fix PackInfo codegen

---
 .../pystencils_walberla/templates/CpuPackInfo.tmpl.h | 12 ++++++++++--
 .../pystencils_walberla/templates/GpuPackInfo.tmpl.h |  2 +-
 src/communication/UniformPackInfo.h                  |  8 ++++++++
 3 files changed, 19 insertions(+), 3 deletions(-)

diff --git a/python/pystencils_walberla/templates/CpuPackInfo.tmpl.h b/python/pystencils_walberla/templates/CpuPackInfo.tmpl.h
index 66114de6e..716da0445 100644
--- a/python/pystencils_walberla/templates/CpuPackInfo.tmpl.h
+++ b/python/pystencils_walberla/templates/CpuPackInfo.tmpl.h
@@ -25,6 +25,8 @@
 #include "domain_decomposition/IBlock.h"
 #include "communication/UniformPackInfo.h"
 
+#include <memory>
+
 #define FUNC_PREFIX
 
 #ifdef __GNUC__
@@ -52,7 +54,10 @@ public:
 
    void unpackData(IBlock * receiver, stencil::Direction dir, mpi::RecvBuffer & buffer) {
         const auto dataSize = size(dir, receiver);
-        unpack(dir, buffer.skip(dataSize), receiver);
+        auto bufferSize = dataSize + sizeof({{dtype}});
+        auto bufferPtr = reinterpret_cast<void*>(buffer.skip(bufferSize));
+        std::align(alignof({{dtype}}), dataSize, bufferPtr, bufferSize);
+        unpack(dir, reinterpret_cast<unsigned char*>(bufferPtr), receiver);
    }
 
    void communicateLocal(const IBlock * sender, IBlock * receiver, stencil::Direction dir) {
@@ -65,7 +70,10 @@ public:
 
    void packDataImpl(const IBlock * sender, stencil::Direction dir, mpi::SendBuffer & outBuffer) const {
         const auto dataSize = size(dir, sender);
-        pack(dir, outBuffer.forward(dataSize), const_cast<IBlock*>(sender));
+        auto bufferSize = dataSize + sizeof({{dtype}});
+        auto bufferPtr = reinterpret_cast<void*>(outBuffer.forward(bufferSize));
+        std::align(alignof({{dtype}}), dataSize, bufferPtr, bufferSize);
+        pack(dir, reinterpret_cast<unsigned char*>(bufferPtr), const_cast<IBlock *>(sender));
    }
 
    void pack  (stencil::Direction dir, unsigned char * buffer, IBlock * block) const;
diff --git a/python/pystencils_walberla/templates/GpuPackInfo.tmpl.h b/python/pystencils_walberla/templates/GpuPackInfo.tmpl.h
index b301bced5..cd5b23677 100644
--- a/python/pystencils_walberla/templates/GpuPackInfo.tmpl.h
+++ b/python/pystencils_walberla/templates/GpuPackInfo.tmpl.h
@@ -59,7 +59,7 @@ public:
     void pack  (stencil::Direction dir, unsigned char * buffer, IBlock * block, gpuStream_t stream) override;
     void communicateLocal  ( stencil::Direction /*dir*/, const IBlock* /* sender */, IBlock* /* receiver */, gpuStream_t /* stream */ ) override
     {
-       WALBERLA_ABORT("Local Communication not implemented yet for standard PackInfos. To run your application turn of local communication in the Communication class")
+       WALBERLA_ABORT("Local Communication not implemented yet for standard PackInfos. To run your application, turn off local communication in the communication class, e.g. with useLocalCommunication=false")
     }
     void unpack(stencil::Direction dir, unsigned char * buffer, IBlock * block, gpuStream_t stream) override;
     uint_t size  (stencil::Direction dir, IBlock * block) override;
diff --git a/src/communication/UniformPackInfo.h b/src/communication/UniformPackInfo.h
index 168ce9685..dd35b0087 100644
--- a/src/communication/UniformPackInfo.h
+++ b/src/communication/UniformPackInfo.h
@@ -100,6 +100,10 @@ public:
     *
     * If NOT thread-safe, \ref threadsafeReceiving must return false!
     *
+    * Implementations must reserve extra space and advance the send buffer
+    * pointer according to the alignment of the ghost layer data type!
+    * The buffer is char-aligned.
+    *
     * @param receiver the block where the unpacked data should be stored into
     * @param dir      receive data from neighbor in this direction
     * @param buffer   buffer for reading the data from
@@ -145,6 +149,10 @@ protected:
     *
     * Must be thread-safe!
     *
+    * Implementations must reserve extra space and advance the send buffer
+    * pointer according to the alignment of the ghost layer data type!
+    * The buffer is char-aligned.
+    *
     * @param sender     the block whose data should be packed into a buffer
     * @param dir        pack data for neighbor in this direction
     * @param buffer     buffer for writing the data into
-- 
GitLab