de/d05/TestAlgo_8dev_8cc_source.html

 // Check that ALPAKA_HOST_ONLY is not defined during device compilation:
 #ifdef ALPAKA_HOST_ONLY
 #error ALPAKA_HOST_ONLY defined in device compilation
 #endif

 #include <alpaka/alpaka.hpp>

 #include "DataFormats/PortableTestObjects/interface/alpaka/TestDeviceCollection.h"
 #include "HeterogeneousCore/AlpakaInterface/interface/config.h"
 #include "HeterogeneousCore/AlpakaInterface/interface/traits.h"
 #include "HeterogeneousCore/AlpakaInterface/interface/workdivision.h"

 #include "TestAlgo.h"

 namespace ALPAKA_ACCELERATOR_NAMESPACE {

   using namespace cms::alpakatools;

   // Kernel functor that fills a TestDeviceCollection view: the scalar "r" is written once,
   // and each of the first "size" elements is assigned a full row.
   class TestAlgoKernel {
   public:
     template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
     ALPAKA_FN_ACC void operator()(TAcc const& acc,
                                   portabletest::TestDeviceCollection::View view,
                                   int32_t size,
                                   double xvalue) const {
       // constant payload used for every element; the matrix is multiplied by the element index below
       const portabletest::Array defaultFlags = {{6, 4, 2, 0}};
       const portabletest::Matrix baseMatrix{{1, 2, 3, 4, 5, 6}, {2, 4, 6, 8, 10, 12}, {3, 6, 9, 12, 15, 18}};

       // the scalar member is written only once in the whole kernel grid
       if (once_per_grid(acc)) {
         view.r() = 1.;
       }

       // strided loop over the kernel grid, covering up to "size" elements
       for (int32_t idx : elements_with_stride(acc, size)) {
         view[idx] = {xvalue, 0., 0., idx, defaultFlags, baseMatrix * idx};
       }
     }
   };

   // Enqueue TestAlgoKernel on "queue" to fill all elements of "collection", passing "xvalue" through.
   void TestAlgo::fill(Queue& queue, portabletest::TestDeviceCollection& collection, double xvalue) const {
     // number of elements the kernel has to cover
     const auto size = collection->metadata().size();

     // 64 items per group: the value is arbitrary, but it's a reasonable starting point
     constexpr uint32_t itemsPerGroup = 64;

     // as many groups as needed to cover the whole problem
     const uint32_t groupCount = divide_up_by(size, itemsPerGroup);

     // items are mapped to
     //   - threads with a single element per thread on a GPU backend
     //   - elements within a single thread on a CPU backend
     const auto workDiv = make_workdiv<Acc1D>(groupCount, itemsPerGroup);

     alpaka::exec<Acc1D>(queue, workDiv, TestAlgoKernel{}, collection.view(), size, xvalue);
   }

   // Kernel functor that writes x, y, z and id into the struct pointed to by "data".
   class TestAlgoStructKernel {
   public:
     template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
     ALPAKA_FN_ACC void operator()(TAcc const& acc,
                                   portabletest::TestDeviceObject::Product* data,
                                   double x,
                                   double y,
                                   double z,
                                   int32_t id) const {
       // only a single thread of the grid performs the writes; all others leave immediately
       if (not once_per_grid(acc)) {
         return;
       }

       data->x = x;
       data->y = y;
       data->z = z;
       data->id = id;
     }
   };

   // Enqueue TestAlgoStructKernel on "queue" to store x, y, z and id into "object".
   void TestAlgo::fillObject(
       Queue& queue, portabletest::TestDeviceObject& object, double x, double y, double z, int32_t id) const {
     // a (1, 1) work division: the kernel runs on a single thread
     alpaka::exec<Acc1D>(queue, make_workdiv<Acc1D>(1, 1), TestAlgoStructKernel{}, object.data(), x, y, z, id);
   }

   // Kernel functor that copies "input" into "output", adding esData.val(i) + esData.val2(i)
   // to the x value of each element i that is also covered by "esData".
   class TestAlgoKernelUpdate {
   public:
     template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
     ALPAKA_FN_ACC void operator()(TAcc const& acc,
                                   portabletest::TestDeviceCollection::ConstView input,
                                   AlpakaESTestDataEDevice::ConstView esData,
                                   portabletest::TestDeviceCollection::View output) const {
       // the scalar member is copied only once in the whole kernel grid
       if (once_per_grid(acc)) {
         output.r() = input.r();
       }

       // loop bounds do not change inside the loop, so read them up front
       const auto outputSize = output.metadata().size();
       const auto esSize = esData.size();

       // strided loop over the kernel grid, covering all elements of the output
       for (int32_t idx : elements_with_stride(acc, outputSize)) {
         double shiftedX = input[idx].x();
         // the event setup data may have fewer entries than the collection
         if (idx < esSize) {
           shiftedX += esData.val(idx) + esData.val2(idx);
         }
         output[idx] = {
             shiftedX, input[idx].y(), input[idx].z(), input[idx].id(), input[idx].flags(), input[idx].m()};
       }
     }
   };

   // Build a new collection with the same size as "input" and enqueue TestAlgoKernelUpdate on "queue"
   // to fill it from "input" and "esData"; the new collection is returned.
   portabletest::TestDeviceCollection TestAlgo::update(Queue& queue,
                                                       portabletest::TestDeviceCollection const& input,
                                                       AlpakaESTestDataEDevice const& esData) const {
     // destination collection, constructed with the input size and the queue
     portabletest::TestDeviceCollection updated{input->metadata().size(), queue};

     // 64 items per group: the value is arbitrary, but it's a reasonable starting point
     constexpr uint32_t itemsPerGroup = 64;

     // as many groups as needed to cover the whole problem
     const uint32_t groupCount = divide_up_by(updated->metadata().size(), itemsPerGroup);

     // items are mapped to
     //   - threads with a single element per thread on a GPU backend
     //   - elements within a single thread on a CPU backend
     const auto workDiv = make_workdiv<Acc1D>(groupCount, itemsPerGroup);

     alpaka::exec<Acc1D>(queue, workDiv, TestAlgoKernelUpdate{}, input.view(), esData.view(), updated.view());

     return updated;
   }

 }  // namespace ALPAKA_ACCELERATOR_NAMESPACE
TestDeviceCollection.h

makeMuonMisalignmentScenario.matrix
list matrix
Definition: makeMuonMisalignmentScenario.py:141

mps_fire.i
i
Definition: mps_fire.py:429

ALPAKA_ACCELERATOR_NAMESPACE::TestAlgo::fillObject
void fillObject(Queue &queue, portabletest::TestDeviceObject &object, double x, double y, double z, int32_t id) const
Definition: TestAlgo.dev.cc:75

cms::alpakatools::divide_up_by
constexpr Idx divide_up_by(Idx value, Idx divisor)
Definition: workdivision.h:19

cms::alpakatest::AlpakaESTestDataE::ConstView::size
constexpr auto size() const
Definition: AlpakaESTestData.h:50

portabletest::Matrix
Eigen::Matrix< double, 3, 6 > Matrix
Definition: TestSoA.h:19

ALPAKA_ACCELERATOR_NAMESPACE::TestAlgoStructKernel
Definition: TestAlgo.dev.cc:56

pv::view
view
Definition: PreparePVTrends.h:58

workdivision.h

ALPAKA_ACCELERATOR_NAMESPACE::TestAlgo::update
portabletest::TestDeviceCollection update(Queue &queue, portabletest::TestDeviceCollection const &input, AlpakaESTestDataEDevice const &esData) const
Definition: TestAlgo.dev.cc:106

l1ctLayer2EG_cff.id
id
Definition: l1ctLayer2EG_cff.py:85

ALPAKA_ACCELERATOR_NAMESPACE::TestAlgoKernel::operator()
ALPAKA_FN_ACC void operator()(TAcc const &acc, portabletest::TestDeviceCollection::View view, int32_t size, double xvalue) const
Definition: TestAlgo.dev.cc:22

ALPAKA_ACCELERATOR_NAMESPACE::portabletest::TestDeviceCollection
PortableCollection< TestSoA > TestDeviceCollection
Definition: TestDeviceCollection.h:21

createBeamHaloJobs.queue
queue
Definition: createBeamHaloJobs.py:343

cms::alpakatools
Definition: PortableCollection.h:32

ALPAKA_ACCELERATOR_NAMESPACE::TestAlgoStructKernel::operator()
ALPAKA_FN_ACC void operator()(TAcc const &acc, portabletest::TestDeviceObject::Product *data, double x, double y, double z, int32_t id) const
Definition: TestAlgo.dev.cc:59

input
static std::string const input
Definition: EdmProvDump.cc:50

ALPAKA_ACCELERATOR_NAMESPACE
Definition: SiPixelCablingSoAESProducer.cc:21

ALPAKA_ACCELERATOR_NAMESPACE::portabletest::TestDeviceObject
PortableObject< TestStruct > TestDeviceObject
Definition: TestDeviceObject.h:18

universalConfigTemplate.collection
collection
Definition: universalConfigTemplate.py:81

cms::alpakatest::AlpakaESTestDataE::ConstView
Definition: AlpakaESTestData.h:45

edm::StdArray
Definition: StdArray.h:39

cms::alpakatest::AlpakaESTestDataE
Definition: AlpakaESTestData.h:40

cms::alpakatest::AlpakaESTestDataE::ConstView::val
constexpr int val(int i) const
Definition: AlpakaESTestData.h:51

traits.h

ALPAKA_ACCELERATOR_NAMESPACE::TestAlgoKernelUpdate
Definition: TestAlgo.dev.cc:83

ALPAKA_ACCELERATOR_NAMESPACE::TestAlgo::fill
void fill(Queue &queue, portabletest::TestDeviceCollection &collection, double xvalue=0.) const
Definition: TestAlgo.dev.cc:41

mps_monitormerge.items
list items
Definition: mps_monitormerge.py:29

cms::alpakatools::elements_with_stride
Definition: workdivision.h:115

HLT_2023v12_cff.flags
flags
Definition: HLT_2023v12_cff.py:10091

TestAlgo.h

cms::alpakatest::AlpakaESTestDataE::view
ConstView view() const
Definition: AlpakaESTestData.h:66

cms::alpakatools::once_per_grid
ALPAKA_FN_ACC constexpr bool once_per_grid(TAcc const &acc)
Definition: workdivision.h:793

data
char data[epos_bytes_allocation]
Definition: EPOS_Wrapper.h:80

ALPAKA_ACCELERATOR_NAMESPACE::TestAlgoKernel
Definition: TestAlgo.dev.cc:19

x
float x
Definition: beamSpotDipStandalone.cc:55

ALPAKA_ACCELERATOR_NAMESPACE::TestAlgoKernelUpdate::operator()
ALPAKA_FN_ACC void operator()(TAcc const &acc, portabletest::TestDeviceCollection::ConstView input, AlpakaESTestDataEDevice::ConstView esData, portabletest::TestDeviceCollection::View output) const
Definition: TestAlgo.dev.cc:86

output
Definition: output.py:1

cms::alpakatest::AlpakaESTestDataE::ConstView::val2
constexpr int val2(int i) const
Definition: AlpakaESTestData.h:52

config.h

sistrip::View
View
Definition: ConstantsForView.h:26