HGCRecHitGPUProduct

Macros

Line Code
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69
#ifndef CUDADAtaFormats_HGCal_HGCRecHitGPUProduct_H
#define CUDADAtaFormats_HGCal_HGCRecHitGPUProduct_H

#include <cassert>
#include <numeric>

#include "HeterogeneousCore/CUDAUtilities/interface/device_unique_ptr.h"
#include "CUDADataFormats/HGCal/interface/HGCRecHitSoA.h"
#include "CUDADataFormats/HGCal/interface/ConstHGCRecHitSoA.h"
#include "CUDADataFormats/HGCal/interface/HGCUncalibRecHitSoA.h"

class HGCRecHitGPUProduct {
public:
  HGCRecHitGPUProduct() = default;
  explicit HGCRecHitGPUProduct(uint32_t nhits, const cudaStream_t &stream) : nhits_(nhits) {
    size_tot_ = std::accumulate(sizes_.begin(), sizes_.end(), 0);  //this might be done at compile time
    pad_ = ((nhits - 1) / 32 + 1) * 32;                            //align to warp boundary (assumption: warpSize = 32)
    mem_ = cms::cuda::make_device_unique<std::byte[]>(pad_ * size_tot_, stream);
  }
  ~HGCRecHitGPUProduct() = default;

  HGCRecHitGPUProduct(const HGCRecHitGPUProduct &) = delete;
  HGCRecHitGPUProduct &operator=(const HGCRecHitGPUProduct &) = delete;
  HGCRecHitGPUProduct(HGCRecHitGPUProduct &&) = default;
  HGCRecHitGPUProduct &operator=(HGCRecHitGPUProduct &&) = default;

  HGCRecHitSoA get() {
    HGCRecHitSoA soa;
    soa.energy_ = reinterpret_cast<float *>(mem_.get());
    soa.time_ = soa.energy_ + pad_;
    soa.timeError_ = soa.time_ + pad_;
    soa.id_ = reinterpret_cast<uint32_t *>(soa.timeError_ + pad_);
    soa.flagBits_ = soa.id_ + pad_;
    soa.son_ = reinterpret_cast<uint8_t *>(soa.flagBits_ + pad_);
    soa.nbytes_ = size_tot_;
    soa.nhits_ = nhits_;
    soa.pad_ = pad_;
    return soa;
  }
  ConstHGCRecHitSoA get() const {
    ConstHGCRecHitSoA soa;
    soa.energy_ = reinterpret_cast<float const *>(mem_.get());
    soa.time_ = soa.energy_ + pad_;
    soa.timeError_ = soa.time_ + pad_;
    soa.id_ = reinterpret_cast<uint32_t const *>(soa.timeError_ + pad_);
    soa.flagBits_ = soa.id_ + pad_;
    soa.son_ = reinterpret_cast<uint8_t const *>(soa.flagBits_ + pad_);
    return soa;
  }

  //number of hits stored in the SoA
  uint32_t nHits() const { return nhits_; }
  //pad of memory block (used for warp alignment, slighlty larger than 'nhits_')
  uint32_t pad() const { return pad_; }
  //number of bytes of the SoA
  uint32_t nBytes() const { return size_tot_; }

private:
  cms::cuda::device::unique_ptr<std::byte[]> mem_;
  static constexpr std::array<int, memory::npointers::ntypes_hgcrechits_soa> sizes_ = {
      {memory::npointers::float_hgcrechits_soa * sizeof(float),
       memory::npointers::uint32_hgcrechits_soa * sizeof(uint32_t),
       memory::npointers::uint8_hgcrechits_soa * sizeof(uint8_t)}};
  uint32_t pad_;
  uint32_t nhits_;
  uint32_t size_tot_;
};

#endif  //CUDADAtaFormats_HGCal_HGCRecHitGPUProduct_H