CMS 3D CMS Logo

Functions
cms::rocmtest Namespace Reference

Functions

__device__ void add_vectors_d (const double *__restrict__ in1, const double *__restrict__ in2, double *__restrict__ out, size_t size)
 
__device__ void add_vectors_f (const float *__restrict__ in1, const float *__restrict__ in2, float *__restrict__ out, size_t size)
 
__global__ void kernel_add_vectors_d (const double *__restrict__ in1, const double *__restrict__ in2, double *__restrict__ out, size_t size)
 
__global__ void kernel_add_vectors_f (const float *__restrict__ in1, const float *__restrict__ in2, float *__restrict__ out, size_t size)
 
void opaque_add_vectors_d (const double *in1, const double *in2, double *out, size_t size)
 
void opaque_add_vectors_f (const float *in1, const float *in2, float *out, size_t size)
 
void requireDevices ()
 Print message and exit if there are no ROCm devices.
 
bool testDevices ()
 In presence of ROCm devices, return true; otherwise print message and return false.
 
void wrapper_add_vectors_d (const double *__restrict__ in1, const double *__restrict__ in2, double *__restrict__ out, size_t size)
 
void wrapper_add_vectors_f (const float *__restrict__ in1, const float *__restrict__ in2, float *__restrict__ out, size_t size)
 

Function Documentation

◆ add_vectors_d()

__device__ void cms::rocmtest::add_vectors_d ( const double *__restrict__  in1,
const double *__restrict__  in2,
double *__restrict__  out,
size_t  size 
)

Definition at line 22 of file DeviceAddition.hip.cc.

References cms::cudacompat::blockDim, cms::cudacompat::blockIdx, cms::cudacompat::gridDim, mps_fire::i, MillePedeFileConverter_cfg::out, riemannFit::stride, and cms::cudacompat::threadIdx.

Referenced by kernel_add_vectors_d().

25  {
26  uint32_t thread = threadIdx.x + blockIdx.x * blockDim.x;
27  uint32_t stride = blockDim.x * gridDim.x;
28 
29  for (size_t i = thread; i < size; i += stride) {
30  out[i] = in1[i] + in2[i];
31  }
32  }
const dim3 threadIdx
Definition: cudaCompat.h:29
size
Write out results.
const dim3 gridDim
Definition: cudaCompat.h:33
const dim3 blockDim
Definition: cudaCompat.h:30
constexpr uint32_t stride
Definition: HelixFit.h:22
const dim3 blockIdx
Definition: cudaCompat.h:32

◆ add_vectors_f()

__device__ void cms::rocmtest::add_vectors_f ( const float *__restrict__  in1,
const float *__restrict__  in2,
float *__restrict__  out,
size_t  size 
)

Definition at line 10 of file DeviceAddition.hip.cc.

References cms::cudacompat::blockDim, cms::cudacompat::blockIdx, cms::cudacompat::gridDim, mps_fire::i, MillePedeFileConverter_cfg::out, riemannFit::stride, and cms::cudacompat::threadIdx.

Referenced by kernel_add_vectors_f(), and HeterogeneousTestROCmDevicePlugins::kernel_add_vectors_f().

13  {
14  uint32_t thread = threadIdx.x + blockIdx.x * blockDim.x;
15  uint32_t stride = blockDim.x * gridDim.x;
16 
17  for (size_t i = thread; i < size; i += stride) {
18  out[i] = in1[i] + in2[i];
19  }
20  }
const dim3 threadIdx
Definition: cudaCompat.h:29
size
Write out results.
const dim3 gridDim
Definition: cudaCompat.h:33
const dim3 blockDim
Definition: cudaCompat.h:30
constexpr uint32_t stride
Definition: HelixFit.h:22
const dim3 blockIdx
Definition: cudaCompat.h:32

◆ kernel_add_vectors_d()

__global__ void cms::rocmtest::kernel_add_vectors_d ( const double *__restrict__  in1,
const double *__restrict__  in2,
double *__restrict__  out,
size_t  size 
)

Definition at line 17 of file DeviceAdditionKernel.hip.cc.

References add_vectors_d(), and MillePedeFileConverter_cfg::out.

20  {
21  add_vectors_d(in1, in2, out, size);
22  }
size
Write out results.
__device__ void add_vectors_d(const double *__restrict__ in1, const double *__restrict__ in2, double *__restrict__ out, size_t size)

◆ kernel_add_vectors_f()

__global__ void cms::rocmtest::kernel_add_vectors_f ( const float *__restrict__  in1,
const float *__restrict__  in2,
float *__restrict__  out,
size_t  size 
)

Definition at line 10 of file DeviceAdditionKernel.hip.cc.

References add_vectors_f(), and MillePedeFileConverter_cfg::out.

13  {
14  add_vectors_f(in1, in2, out, size);
15  }
size
Write out results.
__device__ void add_vectors_f(const float *__restrict__ in1, const float *__restrict__ in2, float *__restrict__ out, size_t size)

◆ opaque_add_vectors_d()

void cms::rocmtest::opaque_add_vectors_d ( const double *  in1,
const double *  in2,
double *  out,
size_t  size 
)

Definition at line 42 of file DeviceAdditionOpaque.cc.

References hipCheck, and wrapper_add_vectors_d().

42  {
43  // allocate input and output buffers on the device
44  double* in1_d;
45  double* in2_d;
46  double* out_d;
47  hipCheck(hipMalloc(&in1_d, size * sizeof(double)));
48  hipCheck(hipMalloc(&in2_d, size * sizeof(double)));
49  hipCheck(hipMalloc(&out_d, size * sizeof(double)));
50 
51  // copy the input data to the device
52  hipCheck(hipMemcpy(in1_d, in1_h, size * sizeof(double), hipMemcpyHostToDevice));
53  hipCheck(hipMemcpy(in2_d, in2_h, size * sizeof(double), hipMemcpyHostToDevice));
54 
55  // fill the output buffer with zeros
56  hipCheck(hipMemset(out_d, 0, size * sizeof(double)));
57 
58  // launch the 1-dimensional kernel for vector addition
59  wrapper_add_vectors_d(in1_d, in2_d, out_d, size);
60 
61  // copy the results from the device to the host
62  hipCheck(hipMemcpy(out_h, out_d, size * sizeof(double), hipMemcpyDeviceToHost));
63 
64  // wait for all the operations to complete
65  hipCheck(hipDeviceSynchronize());
66 
67  // free the input and output buffers on the device
68  hipCheck(hipFree(in1_d));
69  hipCheck(hipFree(in2_d));
70  hipCheck(hipFree(out_d));
71  }
size
Write out results.
void wrapper_add_vectors_d(const double *__restrict__ in1, const double *__restrict__ in2, double *__restrict__ out, size_t size)
#define hipCheck(ARG,...)
Definition: hipCheck.h:52

◆ opaque_add_vectors_f()

void cms::rocmtest::opaque_add_vectors_f ( const float *  in1,
const float *  in2,
float *  out,
size_t  size 
)

Definition at line 11 of file DeviceAdditionOpaque.cc.

References hipCheck, and wrapper_add_vectors_f().

Referenced by ROCmTestOpaqueAdditionModule::analyze().

11  {
12  // allocate input and output buffers on the device
13  float* in1_d;
14  float* in2_d;
15  float* out_d;
16  hipCheck(hipMalloc(&in1_d, size * sizeof(float)));
17  hipCheck(hipMalloc(&in2_d, size * sizeof(float)));
18  hipCheck(hipMalloc(&out_d, size * sizeof(float)));
19 
20  // copy the input data to the device
21  hipCheck(hipMemcpy(in1_d, in1_h, size * sizeof(float), hipMemcpyHostToDevice));
22  hipCheck(hipMemcpy(in2_d, in2_h, size * sizeof(float), hipMemcpyHostToDevice));
23 
24  // fill the output buffer with zeros
25  hipCheck(hipMemset(out_d, 0, size * sizeof(float)));
26 
27  // launch the 1-dimensional kernel for vector addition
28  wrapper_add_vectors_f(in1_d, in2_d, out_d, size);
29 
30  // copy the results from the device to the host
31  hipCheck(hipMemcpy(out_h, out_d, size * sizeof(float), hipMemcpyDeviceToHost));
32 
33  // wait for all the operations to complete
34  hipCheck(hipDeviceSynchronize());
35 
36  // free the input and output buffers on the device
37  hipCheck(hipFree(in1_d));
38  hipCheck(hipFree(in2_d));
39  hipCheck(hipFree(out_d));
40  }
size
Write out results.
#define hipCheck(ARG,...)
Definition: hipCheck.h:52
void wrapper_add_vectors_f(const float *__restrict__ in1, const float *__restrict__ in2, float *__restrict__ out, size_t size)

◆ requireDevices()

void cms::rocmtest::requireDevices ( )

Print message and exit if there are no ROCm devices.

Definition at line 24 of file requireDevices.cc.

References beamvalidation::exit(), and testDevices().

24  {
25  if (not testDevices()) {
26  exit(EXIT_SUCCESS);
27  }
28  }
bool testDevices()
In presence of ROCm devices, return true; otherwise print message and return false.
def exit(msg="")

◆ testDevices()

bool cms::rocmtest::testDevices ( )

In presence of ROCm devices, return true; otherwise print message and return false.

Definition at line 10 of file requireDevices.cc.

References DMR_cfg::cerr, cms::alpakatools::devices(), and mps_update::status.

Referenced by requireDevices().

10  {
11  int devices = 0;
12  auto status = hipGetDeviceCount(&devices);
13  if (status != hipSuccess) {
14  std::cerr << "Failed to initialise the ROCm runtime, the test will be skipped.\n";
15  return false;
16  }
17  if (devices == 0) {
18  std::cerr << "No ROCm devices available, the test will be skipped.\n";
19  return false;
20  }
21  return true;
22  }
std::vector< alpaka::Dev< TPlatform > > const & devices()
Definition: devices.h:22

◆ wrapper_add_vectors_d()

void cms::rocmtest::wrapper_add_vectors_d ( const double *__restrict__  in1,
const double *__restrict__  in2,
double *__restrict__  out,
size_t  size 
)

Definition at line 20 of file DeviceAdditionWrapper.hip.cc.

References hipCheck, and MillePedeFileConverter_cfg::out.

Referenced by cms::cudatest::opaque_add_vectors_d(), and opaque_add_vectors_d().

23  {
24  // launch the 1-dimensional kernel for vector addition
25  kernel_add_vectors_d<<<32, 32>>>(in1, in2, out, size);
26  hipCheck(hipGetLastError());
27  }
size
Write out results.
#define hipCheck(ARG,...)
Definition: hipCheck.h:52

◆ wrapper_add_vectors_f()

void cms::rocmtest::wrapper_add_vectors_f ( const float *__restrict__  in1,
const float *__restrict__  in2,
float *__restrict__  out,
size_t  size 
)

Definition at line 11 of file DeviceAdditionWrapper.hip.cc.

References hipCheck, and MillePedeFileConverter_cfg::out.

Referenced by CUDATestWrapperAdditionModule::analyze(), ROCmTestWrapperAdditionModule::analyze(), CUDATestKernelAdditionModule::analyze(), CUDATestDeviceAdditionModule::analyze(), cms::cudatest::opaque_add_vectors_f(), and opaque_add_vectors_f().

14  {
15  // launch the 1-dimensional kernel for vector addition
16  kernel_add_vectors_f<<<32, 32>>>(in1, in2, out, size);
17  hipCheck(hipGetLastError());
18  }
size
Write out results.
#define hipCheck(ARG,...)
Definition: hipCheck.h:52