Warning, /HeterogeneousTest/CUDAWrapper/src/DeviceAdditionWrapper.cu is written in an unsupported language. File is not indexed.
0001 #include <cstddef>
0002
0003 #include <cuda_runtime.h>
0004
0005 #include "HeterogeneousTest/CUDAKernel/interface/DeviceAdditionKernel.h"
0006 #include "HeterogeneousTest/CUDAWrapper/interface/DeviceAdditionWrapper.h"
0007 #include "HeterogeneousCore/CUDAUtilities/interface/cudaCheck.h"
0008
0009 namespace cms::cudatest {
0010
0011 void wrapper_add_vectors_f(const float* __restrict__ in1,
0012 const float* __restrict__ in2,
0013 float* __restrict__ out,
0014 size_t size) {
0015 // launch the 1-dimensional kernel for vector addition
0016 kernel_add_vectors_f<<<32, 32>>>(in1, in2, out, size);
0017 cudaCheck(cudaGetLastError());
0018 }
0019
0020 void wrapper_add_vectors_d(const double* __restrict__ in1,
0021 const double* __restrict__ in2,
0022 double* __restrict__ out,
0023 size_t size) {
0024 // launch the 1-dimensional kernel for vector addition
0025 kernel_add_vectors_d<<<32, 32>>>(in1, in2, out, size);
0026 cudaCheck(cudaGetLastError());
0027 }
0028
0029 } // namespace cms::cudatest