reserved enough size in the fifo buffer to reorder all added proper 4 byte alignment

2025-07-12 19:01:50 +02:00 · 2025-03-18 21:42:34 +01:00
parent e0a48e1e75
commit f056f9d31b
4 changed files with 75 additions and 36 deletions
--- a/slsReceiverSoftware/src/DataProcessor.cpp
+++ b/slsReceiverSoftware/src/DataProcessor.cpp
@ -26,6 +26,49 @@

 namespace sls {

+// TODO: move somewhere else
+template <typename T> struct AlignedData {
+    T *ptr; // Aligned data pointer
+    std::unique_ptr<std::aligned_storage_t<sizeof(T), alignof(T)>[]> buffer;
+
+    AlignedData(
+        T *p,
+        std::unique_ptr<std::aligned_storage_t<sizeof(T), alignof(T)>[]> buf)
+        : ptr(p), buffer(std::move(buf)) {}
+};
+
+// TODO: should not be in this file any suggestions to move it to a more
+// appropriate file?
+// TODO: Add unit test
+/*
+ * AlignData
+ * Aligns data to a given type T with proper alignment
+ * @param data: pointer to data
+ * @param size: size of data to align in bytes
+ * @return: aligned data
+ */
+template <typename T>
+void AlignData(AlignedData<T> &aligneddata, char *data, size_t size) {
+    using AlignedBuffer =
+        typename std::aligned_storage<sizeof(T), alignof(T)>::type;
+    std::unique_ptr<AlignedBuffer[]> tempbuffer;
+
+    if (reinterpret_cast<uintptr_t>(data) % alignof(uint64_t) == 0) {
+        // If aligned directly cast to pointer
+
+        aligneddata.ptr = reinterpret_cast<T *>(data);
+
+    } else {
+        // Allocate a temporary buffer with proper alignment
+        tempbuffer = std::make_unique<AlignedBuffer[]>(size / sizeof(T));
+        // size = ctbDigitaldbt;
+
+        std::memcpy(tempbuffer.get(), data, size);
+        aligneddata.buffer = std::move(tempbuffer);
+        aligneddata.ptr = reinterpret_cast<T *>(aligneddata.buffer.get());
+    }
+}
+
 const std::string DataProcessor::typeName = "DataProcessor";

 DataProcessor::DataProcessor(int index) : ThreadObject(index, typeName) {
@ -574,26 +617,11 @@ void DataProcessor::Reorder(size_t &size, char *data) {
    }

    // make sure data is aligned to 8 bytes before casting to uint64_t
-    char *ptr = data + nAnalogDataBytes + ctbDbitOffset;
-    uint64_t *source = nullptr;
-    using AlignedBuffer =
-        std::aligned_storage<sizeof(uint64_t), alignof(uint64_t)>::type;
-    std::unique_ptr<AlignedBuffer[]> tempbuffer;
+    AlignedData<uint64_t> aligned_data(nullptr, nullptr);
+    AlignData<uint64_t>(aligned_data, data + nAnalogDataBytes + ctbDbitOffset,
+                        ctbDigitalDataBytes);

-    if (reinterpret_cast<uintptr_t>(ptr) % alignof(uint64_t) == 0) {
-        // If aligned, directly cast to uint64_t pointer
-        source = reinterpret_cast<uint64_t *>(ptr);
-    } else {
-        // Allocate a temporary buffer with proper alignment
-        tempbuffer = std::make_unique<AlignedBuffer[]>(ctbDigitalDataBytes /
-                                                       sizeof(uint64_t));
-
-        std::memcpy(tempbuffer.get(), ptr, ctbDigitalDataBytes);
-        source = reinterpret_cast<uint64_t *>(tempbuffer.get());
-    }
-
-    // auto *source = (uint64_t *)(data + nAnalogDataBytes + ctbDbitOffset);
-    //  TODO: leads to unaligned data
+    uint64_t *source = aligned_data.ptr;

    const size_t numDigitalSamples = (ctbDigitalDataBytes / sizeof(uint64_t));

@ -612,13 +640,10 @@ void DataProcessor::Reorder(size_t &size, char *data) {

    int bitoffset = 0;
    // reorder
-    int count = 0;
-    int written = 0;
    for (size_t bi = 0; bi < 64; ++bi) {

        if (bitoffset != 0) {
            bitoffset = 0;
-            ++count;
            ++dest;
        }

@ -628,10 +653,8 @@ void DataProcessor::Reorder(size_t &size, char *data) {
            ++bitoffset;
            if (bitoffset == 8) {
                bitoffset = 0;
-                ++count;
                ++dest;
            }
-            ++written;
        }
    }

@ -671,7 +694,13 @@ void DataProcessor::ArrangeDbitData(size_t &size, char *data) {
        return;
    }

-    auto *source = (uint64_t *)(data + nAnalogDataBytes + ctbDbitOffset);
+    AlignedData<uint64_t> aligned_data(nullptr, nullptr);
+    AlignData<uint64_t>(aligned_data, data + nAnalogDataBytes + ctbDbitOffset,
+                        ctbDigitalDataBytes);
+
+    uint64_t *source = aligned_data.ptr;
+
+    // auto *source = (uint64_t *)(data + nAnalogDataBytes + ctbDbitOffset);

    const int numDigitalSamples = (ctbDigitalDataBytes / sizeof(uint64_t));

@ -747,19 +776,19 @@ void DataProcessor::ArrangeDbitData(size_t &size, char *data) {
        }
    }

-    // copy back to memory and update size
-    memcpy(data + nAnalogDataBytes, result.data(),
-           totalNumBytes * sizeof(uint8_t));
-
    size = totalNumBytes * sizeof(uint8_t) + nAnalogDataBytes +
           nTransceiverDataBytes;

    // check if size changed, if so move transceiver data to avoid gap in memory
-    if (size < nAnalogDataBytes + nDigitalDataBytes + nTransceiverDataBytes)
+    if (size != nAnalogDataBytes + nDigitalDataBytes + nTransceiverDataBytes)
        memmove(data + nAnalogDataBytes + totalNumBytes * sizeof(uint8_t),
                data + nAnalogDataBytes + nDigitalDataBytes,
                nTransceiverDataBytes);

+    // copy back to memory and update size
+    memcpy(data + nAnalogDataBytes, result.data(),
+           totalNumBytes * sizeof(uint8_t));
+
    LOG(logDEBUG1) << "totalNumBytes: " << totalNumBytes
                   << " nAnalogDataBytes:" << nAnalogDataBytes
                   << " ctbDbitOffset:" << ctbDbitOffset
--- a/slsReceiverSoftware/src/DataProcessor.h
+++ b/slsReceiverSoftware/src/DataProcessor.h
@ -177,7 +177,7 @@ class DataProcessor : private virtual slsDetectorDefs, public ThreadObject {
    uint32_t streamingTimerInMs;
    uint32_t streamingStartFnum;
    uint32_t currentFreqCount{0};
-    struct timespec timerbegin {};
+    struct timespec timerbegin{};
    bool framePadding;
    std::vector<int> ctbDbitList;
    bool reorder{false}; // true if data should be reordered TODO: add as mode
--- a/slsReceiverSoftware/src/GeneralData.h
+++ b/slsReceiverSoftware/src/GeneralData.h
@ -60,8 +60,8 @@ class GeneralData {
    slsDetectorDefs::frameDiscardPolicy frameDiscardMode{
        slsDetectorDefs::NO_DISCARD};

-    GeneralData(){};
-    virtual ~GeneralData(){};
+    GeneralData() {};
+    virtual ~GeneralData() {};

    // Returns the pixel depth in byte, 4 bits being 0.5 byte
    float GetPixelDepth() { return float(dynamicRange) / 8; }
@ -443,6 +443,7 @@ class ChipTestBoardData : public GeneralData {
        nDigitalBytes = 0;
        nTransceiverBytes = 0;
        int nAnalogChans = 0, nDigitalChans = 0, nTransceiverChans = 0;
+        uint64_t digital_bytes_reserved = 0;

        // analog channels (normal, analog/digital readout)
        if (readoutType == slsDetectorDefs::ANALOG_ONLY ||
@ -461,7 +462,12 @@ class ChipTestBoardData : public GeneralData {
            readoutType == slsDetectorDefs::ANALOG_AND_DIGITAL ||
            readoutType == slsDetectorDefs::DIGITAL_AND_TRANSCEIVER) {
            nDigitalChans = NCHAN_DIGITAL;
-            nDigitalBytes = (sizeof(uint64_t) * nDigitalSamples);
+            // allocate enough memory to support reordering of digital bits
+            uint32_t num_bytes_per_bit = (nDigitalSamples % 8 == 0)
+                                             ? nDigitalSamples / 8
+                                             : nDigitalSamples / 8 + 1;
+            digital_bytes_reserved = 64 * num_bytes_per_bit;
+            nDigitalBytes = sizeof(uint64_t) * nDigitalSamples;
            LOG(logDEBUG1) << "Number of Digital Channels:" << nDigitalChans
                           << " Databytes: " << nDigitalBytes;
        }
@ -480,7 +486,7 @@ class ChipTestBoardData : public GeneralData {
        nPixelsX = nAnalogChans + nDigitalChans + nTransceiverChans;
        dataSize = tengigaEnable ? 8144 : UDP_PACKET_DATA_BYTES;
        packetSize = headerSizeinPacket + dataSize;
-        imageSize = nAnalogBytes + nDigitalBytes + nTransceiverBytes;
+        imageSize = nAnalogBytes + digital_bytes_reserved + nTransceiverBytes;
        packetsPerFrame = ceil((double)imageSize / (double)dataSize);

        LOG(logDEBUG1) << "Total Number of Channels:" << nPixelsX
--- a/slsReceiverSoftware/tests/test-ArrangeDataBasedOnBitList.cpp
+++ b/slsReceiverSoftware/tests/test-ArrangeDataBasedOnBitList.cpp
@ -106,7 +106,11 @@ class DataProcessorTestFixture {

    void set_data() {
        delete[] data;
-        data = new char[get_size()];
+        uint64_t max_bytes_per_bit =
+            num_samples % 8 == 0 ? num_samples / 8 : num_samples / 8 + 1;
+        uint64_t reserved_size =
+            get_size() - num_digital_bytes + max_bytes_per_bit * 64;
+        data = new char[reserved_size];

        // set testing data
        memset(data, dummy_value, num_analog_bytes); // set to dummy value