TestAlgo.dev.cc
// Check that ALPAKA_HOST_ONLY is not defined during device compilation:
#ifdef ALPAKA_HOST_ONLY
#error ALPAKA_HOST_ONLY defined in device compilation
#endif

#include <alpaka/alpaka.hpp>

// portable test data formats and alpaka work-division helpers used below
#include "DataFormats/PortableTestObjects/interface/TestDeviceCollection.h"
#include "DataFormats/PortableTestObjects/interface/TestDeviceObject.h"
#include "HeterogeneousCore/AlpakaInterface/interface/config.h"
#include "HeterogeneousCore/AlpakaInterface/interface/workdivision.h"

#include "TestAlgo.h"

namespace ALPAKA_ACCELERATOR_NAMESPACE {

  using namespace cms::alpakatools;

  class TestAlgoKernel {
  public:
    template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
    ALPAKA_FN_ACC void operator()(TAcc const& acc, portabletest::TestDeviceCollection::View view, double xvalue) const {
      const portabletest::Matrix matrix{{1, 2, 3, 4, 5, 6}, {2, 4, 6, 8, 10, 12}, {3, 6, 9, 12, 15, 18}};
      const portabletest::Array flags = {{6, 4, 2, 0}};

      // set this only once in the whole kernel grid
      if (once_per_grid(acc)) {
        view.r() = 1.;
      }

      // make a strided loop over the kernel grid, covering up to "size" elements
      for (int32_t i : uniform_elements(acc, view.metadata().size())) {
        view[i] = {xvalue, 0., 0., i, flags, matrix * i};
      }
    }
  };
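
  // How the strided loop above distributes the work (an illustrative sketch, with example numbers
  // that are not part of the original file): uniform_elements(acc, size) visits every index in
  // [0, size) exactly once, independent of the launch configuration. For instance, with a grid of
  // 2 groups x 64 items = 128 threads/elements and size = 300, the GPU thread with global index 5
  // would process i = 5, 133 and 261, while on a CPU backend each "thread" iterates serially over
  // the elements assigned to its group.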

  class TestAlgoMultiKernel2 {
  public:
    template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
    ALPAKA_FN_ACC void operator()(TAcc const& acc,
                                  portabletest::TestDeviceMultiCollection2::View<1> view,
                                  double xvalue) const {
      const portabletest::Matrix matrix{{1, 2, 3, 4, 5, 6}, {2, 4, 6, 8, 10, 12}, {3, 6, 9, 12, 15, 18}};

      // set this only once in the whole kernel grid
      if (once_per_grid(acc)) {
        view.r2() = 2.;
      }

      // make a strided loop over the kernel grid, covering up to "size" elements
      for (int32_t i : uniform_elements(acc, view.metadata().size())) {
        view[i] = {xvalue, 0., 0., i, matrix * i};
      }
    }
  };

  class TestAlgoMultiKernel3 {
  public:
    template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
    ALPAKA_FN_ACC void operator()(TAcc const& acc,
                                  portabletest::TestDeviceMultiCollection3::View<2> view,
                                  double xvalue) const {
      const portabletest::Matrix matrix{{1, 2, 3, 4, 5, 6}, {2, 4, 6, 8, 10, 12}, {3, 6, 9, 12, 15, 18}};

      // set this only once in the whole kernel grid
      if (once_per_grid(acc)) {
        view.r3() = 3.;
      }

      // make a strided loop over the kernel grid, covering up to "size" elements
      for (int32_t i : uniform_elements(acc, view.metadata().size())) {
        view[i] = {xvalue, 0., 0., i, matrix * i};
      }
    }
  };

  void TestAlgo::fill(Queue& queue, portabletest::TestDeviceCollection& collection, double xvalue) const {
    // use 64 items per group (this value is arbitrary, but it's a reasonable starting point)
    uint32_t items = 64;

    // use as many groups as needed to cover the whole problem
    uint32_t groups = divide_up_by(collection->metadata().size(), items);

    // map items to
    // - threads with a single element per thread on a GPU backend
    // - elements within a single thread on a CPU backend
    auto workDiv = make_workdiv<Acc1D>(groups, items);

    alpaka::exec<Acc1D>(queue, workDiv, TestAlgoKernel{}, collection.view(), xvalue);
  }
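
  // Worked example of the work division above (illustrative only, assuming a collection of 100
  // elements): divide_up_by(100, 64) rounds up to 2 groups, so the kernel is launched over
  // 2 x 64 = 128 threads/elements; the strided loop inside TestAlgoKernel stops at
  // metadata().size() = 100, so the extra 28 threads/elements simply do no work.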

  void TestAlgo::fillMulti2(Queue& queue, portabletest::TestDeviceMultiCollection2& collection, double xvalue) const {
    // use 64 items per group (this value is arbitrary, but it's a reasonable starting point)
    uint32_t items = 64;

    // use as many groups as needed to cover the whole problem
    uint32_t groups = divide_up_by(collection->metadata().size(), items);
    uint32_t groups2 = divide_up_by(collection.view<1>().metadata().size(), items);

    // map items to
    // - threads with a single element per thread on a GPU backend
    // - elements within a single thread on a CPU backend
    auto workDiv = make_workdiv<Acc1D>(groups, items);
    auto workDiv2 = make_workdiv<Acc1D>(groups2, items);

    alpaka::exec<Acc1D>(queue, workDiv, TestAlgoKernel{}, collection.view<portabletest::TestSoA>(), xvalue);
    alpaka::exec<Acc1D>(queue, workDiv2, TestAlgoMultiKernel2{}, collection.view<portabletest::TestSoA2>(), xvalue);
  }

  class TestAlgoStructKernel {
  public:
    template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
    ALPAKA_FN_ACC void operator()(TAcc const& acc,
                                  portabletest::TestDeviceObject::Product* data,
                                  double x,
                                  double y,
                                  double z,
                                  int32_t id) const {
      // run on a single thread
      if (once_per_grid(acc)) {
        data->x = x;
        data->y = y;
        data->z = z;
        data->id = id;
      }
    }
  };

  void TestAlgo::fillObject(
      Queue& queue, portabletest::TestDeviceObject& object, double x, double y, double z, int32_t id) const {
    // run on a single thread
    auto workDiv = make_workdiv<Acc1D>(1, 1);

    alpaka::exec<Acc1D>(queue, workDiv, TestAlgoStructKernel{}, object.data(), x, y, z, id);
  }
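
  // Minimal host-side usage sketch of the fill methods above (hypothetical code, not part of this
  // file; the queue, the collection size of 42 and the filled values are assumptions chosen only
  // for illustration):
  //
  //   portabletest::TestDeviceCollection collection{42, queue};
  //   portabletest::TestDeviceObject object{queue};
  //   TestAlgo algo;
  //   algo.fill(queue, collection, 3.14);
  //   algo.fillObject(queue, object, 1., 2., 3., 7);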

  void TestAlgo::fillMulti3(Queue& queue, portabletest::TestDeviceMultiCollection3& collection, double xvalue) const {
    // use 64 items per group (this value is arbitrary, but it's a reasonable starting point)
    uint32_t items = 64;

    // use as many groups as needed to cover the whole problem
    uint32_t groups = divide_up_by(collection.view<portabletest::TestSoA>().metadata().size(), items);
    uint32_t groups2 = divide_up_by(collection.view<portabletest::TestSoA2>().metadata().size(), items);
    uint32_t groups3 = divide_up_by(collection.view<portabletest::TestSoA3>().metadata().size(), items);

    // map items to
    // - threads with a single element per thread on a GPU backend
    // - elements within a single thread on a CPU backend
    auto workDiv = make_workdiv<Acc1D>(groups, items);
    auto workDiv2 = make_workdiv<Acc1D>(groups2, items);
    auto workDiv3 = make_workdiv<Acc1D>(groups3, items);

    alpaka::exec<Acc1D>(queue, workDiv, TestAlgoKernel{}, collection.view<portabletest::TestSoA>(), xvalue);
    alpaka::exec<Acc1D>(queue, workDiv2, TestAlgoMultiKernel2{}, collection.view<portabletest::TestSoA2>(), xvalue);
    alpaka::exec<Acc1D>(queue, workDiv3, TestAlgoMultiKernel3{}, collection.view<portabletest::TestSoA3>(), xvalue);
  }

  class TestAlgoKernelUpdate {
  public:
    template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
    ALPAKA_FN_ACC void operator()(TAcc const& acc,
                                  portabletest::TestDeviceCollection::ConstView input,
                                  AlpakaESTestDataEDevice::ConstView esData,
                                  portabletest::TestDeviceCollection::View output) const {
      // set this only once in the whole kernel grid
      if (once_per_grid(acc)) {
        output.r() = input.r();
      }

      // make a strided loop over the kernel grid, covering up to "size" elements
      for (int32_t i : uniform_elements(acc, output.metadata().size())) {
        double x = input[i].x();
        if (i < esData.size()) {
          x += esData.val(i) + esData.val2(i);
        }
        output[i] = {x, input[i].y(), input[i].z(), input[i].id(), input[i].flags(), input[i].m()};
      }
    }
  };

  class TestAlgoKernelUpdateMulti2 {
  public:
    template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
    ALPAKA_FN_ACC void operator()(TAcc const& acc,
                                  portabletest::TestSoA::ConstView input,
                                  portabletest::TestSoA2::ConstView input2,
                                  AlpakaESTestDataEDevice::ConstView esData,
                                  portabletest::TestSoA::View output,
                                  portabletest::TestSoA2::View output2) const {
      // set this only once in the whole kernel grid
      if (once_per_grid(acc)) {
        output.r() = input.r();
        output2.r2() = input2.r2();
      }

      // make a strided loop over the kernel grid, covering up to "size" elements
      for (int32_t i : uniform_elements(acc, output.metadata().size())) {
        double x = input[i].x();
        if (i < esData.size()) {
          x += esData.val(i) + esData.val2(i);
        }
        output[i] = {x, input[i].y(), input[i].z(), input[i].id(), input[i].flags(), input[i].m()};
      }
      for (int32_t i : uniform_elements(acc, output2.metadata().size())) {
        double x2 = input2[i].x2();
        if (i < esData.size()) {
          x2 += esData.val(i) + esData.val2(i);
        }
        output2[i] = {x2, input2[i].y2(), input2[i].z2(), input2[i].id2(), input2[i].m2()};
      }
    }
  };

  class TestAlgoKernelUpdateMulti3 {
  public:
    template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
    ALPAKA_FN_ACC void operator()(TAcc const& acc,
                                  portabletest::TestSoA::ConstView input,
                                  portabletest::TestSoA2::ConstView input2,
                                  portabletest::TestSoA3::ConstView input3,
                                  AlpakaESTestDataEDevice::ConstView esData,
                                  portabletest::TestSoA::View output,
                                  portabletest::TestSoA2::View output2,
                                  portabletest::TestSoA3::View output3) const {
      // set this only once in the whole kernel grid
      if (once_per_grid(acc)) {
        output.r() = input.r();
        output2.r2() = input2.r2();
        output3.r3() = input3.r3();
      }

      // make a strided loop over the kernel grid, covering up to "size" elements
      for (int32_t i : uniform_elements(acc, output.metadata().size())) {
        double x = input[i].x();
        if (i < esData.size()) {
          x += esData.val(i) + esData.val2(i);
          if (0 == i)
            printf("Setting x[0] to %f\n", x);
        }
        output[i] = {x, input[i].y(), input[i].z(), input[i].id(), input[i].flags(), input[i].m()};
      }
      for (int32_t i : uniform_elements(acc, output2.metadata().size())) {
        double x2 = input2[i].x2();
        if (i < esData.size()) {
          x2 += esData.val(i) + esData.val2(i);
        }
        output2[i] = {x2, input2[i].y2(), input2[i].z2(), input2[i].id2(), input2[i].m2()};
      }
      for (int32_t i : uniform_elements(acc, output3.metadata().size())) {
        double x3 = input3[i].x3();
        if (i < esData.size()) {
          x3 += esData.val(i) + esData.val2(i);
        }
        output3[i] = {x3, input3[i].y3(), input3[i].z3(), input3[i].id3(), input3[i].m3()};
      }
    }
  };

  portabletest::TestDeviceCollection TestAlgo::update(Queue& queue,
                                                      portabletest::TestDeviceCollection const& input,
                                                      AlpakaESTestDataEDevice const& esData) const {
    portabletest::TestDeviceCollection collection{input->metadata().size(), queue};

    // use 64 items per group (this value is arbitrary, but it's a reasonable starting point)
    uint32_t items = 64;

    // use as many groups as needed to cover the whole problem
    uint32_t groups = divide_up_by(collection->metadata().size(), items);

    // map items to
    // - threads with a single element per thread on a GPU backend
    // - elements within a single thread on a CPU backend
    auto workDiv = make_workdiv<Acc1D>(groups, items);

    alpaka::exec<Acc1D>(queue, workDiv, TestAlgoKernelUpdate{}, input.view(), esData.view(), collection.view());

    return collection;
  }
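
  // Illustrative example of what update() computes per element (the numerical values below are
  // assumptions, not taken from this file): if input[i].x() = 3. and the event-setup data has
  // esData.val(i) = 1 and esData.val2(i) = 2 for i < esData.size(), then output[i].x() becomes
  // 3. + 1 + 2 = 6., while y, z, id, flags and the matrix are copied through unchanged; elements
  // with i >= esData.size() keep x unchanged as well.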

  portabletest::TestDeviceMultiCollection2 TestAlgo::updateMulti2(Queue& queue,
                                                                  portabletest::TestDeviceMultiCollection2 const& input,
                                                                  AlpakaESTestDataEDevice const& esData) const {
    portabletest::TestDeviceMultiCollection2 collection{input.sizes(), queue};

    // use 64 items per group (this value is arbitrary, but it's a reasonable starting point)
    uint32_t items = 64;

    // use as many groups as needed to cover the whole problem
    auto sizes = collection.sizes();
    uint32_t groups = divide_up_by(*std::max_element(sizes.begin(), sizes.end()), items);

    // map items to
    // - threads with a single element per thread on a GPU backend
    // - elements within a single thread on a CPU backend
    auto workDiv = make_workdiv<Acc1D>(groups, items);

    alpaka::exec<Acc1D>(queue,
                        workDiv,
                        TestAlgoKernelUpdateMulti2{},
                        input.view<portabletest::TestSoA>(),
                        input.view<portabletest::TestSoA2>(),
                        esData.view(),
                        collection.view<portabletest::TestSoA>(),
                        collection.view<portabletest::TestSoA2>());

    return collection;
  }
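
  // Note on the single work division above (example sizes assumed for illustration): with layer
  // sizes {100, 50}, the grid is dimensioned for the largest layer, divide_up_by(100, 64) = 2
  // groups, and the same launch is reused for both SoA layers; each strided loop in the kernel is
  // bounded by its own metadata().size(), so the smaller layer is still covered correctly.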

  portabletest::TestDeviceMultiCollection3 TestAlgo::updateMulti3(Queue& queue,
                                                                  portabletest::TestDeviceMultiCollection3 const& input,
                                                                  AlpakaESTestDataEDevice const& esData) const {
    portabletest::TestDeviceMultiCollection3 collection{input.sizes(), queue};

    // use 64 items per group (this value is arbitrary, but it's a reasonable starting point)
    uint32_t items = 64;

    // use as many groups as needed to cover the whole problem
    auto sizes = collection.sizes();
    uint32_t groups = divide_up_by(*std::max_element(sizes.begin(), sizes.end()), items);

    // map items to
    // - threads with a single element per thread on a GPU backend
    // - elements within a single thread on a CPU backend
    auto workDiv = make_workdiv<Acc1D>(groups, items);

    alpaka::exec<Acc1D>(queue,
                        workDiv,
                        TestAlgoKernelUpdateMulti3{},
                        input.view<portabletest::TestSoA>(),
                        input.view<portabletest::TestSoA2>(),
                        input.view<portabletest::TestSoA3>(),
                        esData.view(),
                        collection.view<portabletest::TestSoA>(),
                        collection.view<portabletest::TestSoA2>(),
                        collection.view<portabletest::TestSoA3>());

    return collection;
  }

  class TestZeroCollectionKernel {
  public:
    template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
    ALPAKA_FN_ACC void operator()(TAcc const& acc, portabletest::TestDeviceCollection::ConstView view) const {
      const portabletest::Matrix matrix{{0, 0, 0, 0, 0, 0}, {0, 0, 0, 0, 0, 0}, {0, 0, 0, 0, 0, 0}};
      const portabletest::Array flags = {{0, 0, 0, 0}};

      // check this only once in the whole kernel grid
      if (once_per_grid(acc)) {
        ALPAKA_ASSERT(view.r() == 0.);
      }

      // make a strided loop over the kernel grid, covering up to "size" elements
      for (int32_t i : uniform_elements(acc, view.metadata().size())) {
        auto element = view[i];
        ALPAKA_ASSERT(element.x() == 0.);
        ALPAKA_ASSERT(element.y() == 0.);
        ALPAKA_ASSERT(element.z() == 0.);
        ALPAKA_ASSERT(element.id() == 0.);
        ALPAKA_ASSERT(element.flags() == flags);
        ALPAKA_ASSERT(element.m() == matrix);
      }
    }
  };

  class TestZeroMultiCollectionKernel2 {
  public:
    template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
    ALPAKA_FN_ACC void operator()(TAcc const& acc, portabletest::TestDeviceMultiCollection2::ConstView<1> view) const {
      const portabletest::Matrix matrix{{0, 0, 0, 0, 0, 0}, {0, 0, 0, 0, 0, 0}, {0, 0, 0, 0, 0, 0}};

      // check this only once in the whole kernel grid
      if (once_per_grid(acc)) {
        ALPAKA_ASSERT(view.r2() == 0.);
      }

      // make a strided loop over the kernel grid, covering up to "size" elements
      for (int32_t i : uniform_elements(acc, view.metadata().size())) {
        auto element = view[i];
        ALPAKA_ASSERT(element.x2() == 0.);
        ALPAKA_ASSERT(element.y2() == 0.);
        ALPAKA_ASSERT(element.z2() == 0.);
        ALPAKA_ASSERT(element.id2() == 0.);
        ALPAKA_ASSERT(element.m2() == matrix);
      }
    }
  };

  class TestZeroMultiCollectionKernel3 {
  public:
    template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
    ALPAKA_FN_ACC void operator()(TAcc const& acc, portabletest::TestDeviceMultiCollection3::ConstView<2> view) const {
      const portabletest::Matrix matrix{{0, 0, 0, 0, 0, 0}, {0, 0, 0, 0, 0, 0}, {0, 0, 0, 0, 0, 0}};

      // check this only once in the whole kernel grid
      if (once_per_grid(acc)) {
        ALPAKA_ASSERT(view.r3() == 0.);
      }

      // make a strided loop over the kernel grid, covering up to "size" elements
      for (int32_t i : uniform_elements(acc, view.metadata().size())) {
        auto element = view[i];
        ALPAKA_ASSERT(element.x3() == 0.);
        ALPAKA_ASSERT(element.y3() == 0.);
        ALPAKA_ASSERT(element.z3() == 0.);
        ALPAKA_ASSERT(element.id3() == 0.);
        ALPAKA_ASSERT(element.m3() == matrix);
      }
    }
  };

  class TestZeroStructKernel {
  public:
    template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
    ALPAKA_FN_ACC void operator()(TAcc const& acc, portabletest::TestDeviceObject::Product const* data) const {
      // check this only once in the whole kernel grid
      if (once_per_grid(acc)) {
        ALPAKA_ASSERT(data->x == 0.);
        ALPAKA_ASSERT(data->y == 0.);
        ALPAKA_ASSERT(data->z == 0.);
        ALPAKA_ASSERT(data->id == 0);
      }
    }
  };

  // Check that the collection has been filled with zeroes.
  void TestAlgo::checkZero(Queue& queue, portabletest::TestDeviceCollection const& collection) const {
    // create a work division with a single block and
    // - 32 threads with a single element per thread on a GPU backend
    // - 32 elements within a single thread on a CPU backend
    auto workDiv = make_workdiv<Acc1D>(1, 32);

    // the kernel will make a strided loop over the launch grid to cover all elements in the collection
    alpaka::exec<Acc1D>(queue, workDiv, TestZeroCollectionKernel{}, collection.const_view());
  }

  // Check that the collection has been filled with zeroes.
  void TestAlgo::checkZero(Queue& queue, portabletest::TestDeviceMultiCollection2 const& collection) const {
    // create a work division with a single block and
    // - 32 threads with a single element per thread on a GPU backend
    // - 32 elements within a single thread on a CPU backend
    auto workDiv = make_workdiv<Acc1D>(1, 32);

    // the kernels will make a strided loop over the launch grid to cover all elements in the collection
    alpaka::exec<Acc1D>(queue, workDiv, TestZeroCollectionKernel{}, collection.const_view<portabletest::TestSoA>());
    alpaka::exec<Acc1D>(
        queue, workDiv, TestZeroMultiCollectionKernel2{}, collection.const_view<portabletest::TestSoA2>());
  }

  // Check that the collection has been filled with zeroes.
  void TestAlgo::checkZero(Queue& queue, portabletest::TestDeviceMultiCollection3 const& collection) const {
    // create a work division with a single block and
    // - 32 threads with a single element per thread on a GPU backend
    // - 32 elements within a single thread on a CPU backend
    auto workDiv = make_workdiv<Acc1D>(1, 32);

    // the kernels will make a strided loop over the launch grid to cover all elements in the collection
    alpaka::exec<Acc1D>(queue, workDiv, TestZeroCollectionKernel{}, collection.const_view<portabletest::TestSoA>());
    alpaka::exec<Acc1D>(
        queue, workDiv, TestZeroMultiCollectionKernel2{}, collection.const_view<portabletest::TestSoA2>());
    alpaka::exec<Acc1D>(
        queue, workDiv, TestZeroMultiCollectionKernel3{}, collection.const_view<portabletest::TestSoA3>());
  }

  // Check that the object has been filled with zeroes.
  void TestAlgo::checkZero(Queue& queue, portabletest::TestDeviceObject const& object) const {
    // create a work division with a single block and
    // - 32 threads with a single element per thread on a GPU backend
    // - 32 elements within a single thread on a CPU backend
    auto workDiv = make_workdiv<Acc1D>(1, 32);

    // the kernel will actually use a single thread
    alpaka::exec<Acc1D>(queue, workDiv, TestZeroStructKernel{}, object.data());
  }

}  // namespace ALPAKA_ACCELERATOR_NAMESPACE