TrackSoAHeterogeneous_test.cpp

CMSSW/CUDADataFormats/Track/test/TrackSoAHeterogeneous_test.cpp

Line Code

Line	Code
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73	`/*` `Simple test for the pixelTrack::TrackSoA data structure` `which inherits from PortableDeviceCollection.` `Creates an instance of the class (automatically allocates` `memory on device), passes the view of the SoA data to` `the CUDA kernels which:` `- Fill the SoA with data.` `- Verify that the data written is correct.` `Then, the SoA data are copied back to Host, where` `a temporary host-side view (tmp_view) is created using` `the same Layout to access the data on host and print it.` `/` `#include <cstdint>` `#include "CUDADataFormats/Track/interface/TrackSoAHeterogeneousDevice.h"` `#include "CUDADataFormats/Track/interface/TrackSoAHeterogeneousHost.h"` `#include "HeterogeneousCore/CUDAUtilities/interface/requireDevices.h"` `#include "HeterogeneousCore/CUDAUtilities/interface/cudaCheck.h"` `#include "Geometry/CommonTopologies/interface/SimplePixelTopology.h"` `namespace testTrackSoA {` `template <typename TrackerTraits>` `void runKernels(TrackSoAView<TrackerTraits> &tracks_view, cudaStream_t stream);` `}` `int main() {` `cms::cudatest::requireDevices();` `cudaStream_t stream;` `cudaCheck(cudaStreamCreateWithFlags(&stream, cudaStreamNonBlocking));` `// Inner scope to deallocate memory before destroying the stream` `{` `// Instantiate tracks on device. PortableDeviceCollection allocates` `// SoA on device automatically.` `TrackSoAHeterogeneousDevice<pixelTopology::Phase1> tracks_d(stream);` `testTrackSoA::runKernels<pixelTopology::Phase1>(tracks_d.view(), stream);` `// Instantate tracks on host. This is where the data will be` `// copied to from device.` `TrackSoAHeterogeneousHost<pixelTopology::Phase1> tracks_h(stream);` `cudaCheck(cudaMemcpyAsync(` `tracks_h.buffer().get(), tracks_d.const_buffer().get(), tracks_d.bufferSize(), cudaMemcpyDeviceToHost, stream));` `cudaCheck(cudaStreamSynchronize(stream));` `// Print results` `std::cout << "pt"` `<< "\t"` `<< "eta"` `<< "\t"` `<< "chi2"` `<< "\t"` `<< "quality"` `<< "\t"` `<< "nLayers"` `<< "\t"` `<< "hitIndices off" << std::endl;` `for (int i = 0; i < 10; ++i) {` `std::cout << tracks_h.view()[i].pt() << "\t" << tracks_h.view()[i].eta() << "\t" << tracks_h.view()[i].chi2()` `<< "\t" << (int)tracks_h.view()[i].quality() << "\t" << (int)tracks_h.view()[i].nLayers() << "\t"` `<< tracks_h.view().hitIndices().off[i] << std::endl;` `}` `}` `cudaCheck(cudaStreamDestroy(stream));` `return 0;` `}`

1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73

/**
   Simple test for the pixelTrack::TrackSoA data structure
   which inherits from PortableDeviceCollection.

   Creates an instance of the class (automatically allocates
   memory on device), passes the view of the SoA data to
   the CUDA kernels which:
   - Fill the SoA with data.
   - Verify that the data written is correct.

   Then, the SoA data are copied back to Host, where
   a temporary host-side view (tmp_view) is created using
   the same Layout to access the data on host and print it.
 */

#include <cstdint>
#include "CUDADataFormats/Track/interface/TrackSoAHeterogeneousDevice.h"
#include "CUDADataFormats/Track/interface/TrackSoAHeterogeneousHost.h"
#include "HeterogeneousCore/CUDAUtilities/interface/requireDevices.h"
#include "HeterogeneousCore/CUDAUtilities/interface/cudaCheck.h"

#include "Geometry/CommonTopologies/interface/SimplePixelTopology.h"

namespace testTrackSoA {

  template <typename TrackerTraits>
  void runKernels(TrackSoAView<TrackerTraits> &tracks_view, cudaStream_t stream);
}

int main() {
  cms::cudatest::requireDevices();

  cudaStream_t stream;
  cudaCheck(cudaStreamCreateWithFlags(&stream, cudaStreamNonBlocking));

  // Inner scope to deallocate memory before destroying the stream
  {
    // Instantiate tracks on device. PortableDeviceCollection allocates
    // SoA on device automatically.
    TrackSoAHeterogeneousDevice<pixelTopology::Phase1> tracks_d(stream);
    testTrackSoA::runKernels<pixelTopology::Phase1>(tracks_d.view(), stream);

    // Instantate tracks on host. This is where the data will be
    // copied to from device.
    TrackSoAHeterogeneousHost<pixelTopology::Phase1> tracks_h(stream);

    cudaCheck(cudaMemcpyAsync(
        tracks_h.buffer().get(), tracks_d.const_buffer().get(), tracks_d.bufferSize(), cudaMemcpyDeviceToHost, stream));
    cudaCheck(cudaStreamSynchronize(stream));

    // Print results
    std::cout << "pt"
              << "\t"
              << "eta"
              << "\t"
              << "chi2"
              << "\t"
              << "quality"
              << "\t"
              << "nLayers"
              << "\t"
              << "hitIndices off" << std::endl;

    for (int i = 0; i < 10; ++i) {
      std::cout << tracks_h.view()[i].pt() << "\t" << tracks_h.view()[i].eta() << "\t" << tracks_h.view()[i].chi2()
                << "\t" << (int)tracks_h.view()[i].quality() << "\t" << (int)tracks_h.view()[i].nLayers() << "\t"
                << tracks_h.view().hitIndices().off[i] << std::endl;
    }
  }
  cudaCheck(cudaStreamDestroy(stream));

  return 0;
}