PixelClustering.h
#ifndef RecoLocalTracker_SiPixelClusterizer_alpaka_PixelClustering_h
#define RecoLocalTracker_SiPixelClusterizer_alpaka_PixelClustering_h

#include <cmath>
#include <cstdint>
#include <cstdio>
#include <type_traits>

#include <alpaka/alpaka.hpp>

#include "DataFormats/SiPixelClusterSoA/interface/ClusteringConstants.h"
#include "DataFormats/SiPixelClusterSoA/interface/SiPixelClustersSoA.h"
#include "DataFormats/SiPixelDigiSoA/interface/SiPixelDigisSoA.h"
#include "Geometry/CommonTopologies/interface/SimplePixelTopology.h"
#include "HeterogeneousCore/AlpakaInterface/interface/HistoContainer.h"
#include "HeterogeneousCore/AlpakaInterface/interface/config.h"
#include "HeterogeneousCore/AlpakaInterface/interface/workdivision.h"

//#define GPU_DEBUG

namespace ALPAKA_ACCELERATOR_NAMESPACE::pixelClustering {

#ifdef GPU_DEBUG
  template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
  ALPAKA_STATIC_ACC_MEM_GLOBAL uint32_t gMaxHit = 0;
#endif

  namespace pixelStatus {
    // Phase-1 pixel modules
    constexpr uint32_t pixelSizeX = pixelTopology::Phase1::numRowsInModule;
    constexpr uint32_t pixelSizeY = pixelTopology::Phase1::numColsInModule;

    // Use 0x00, 0x01, 0x03 so each can be OR'ed on top of the previous ones
    enum Status : uint32_t { kEmpty = 0x00, kFound = 0x01, kDuplicate = 0x03 };

    constexpr uint32_t bits = 2;
    constexpr uint32_t mask = (0x01 << bits) - 1;
    constexpr uint32_t valuesPerWord = sizeof(uint32_t) * 8 / bits;
    constexpr uint32_t size = pixelSizeX * pixelSizeY / valuesPerWord;

    ALPAKA_FN_ACC ALPAKA_FN_INLINE constexpr uint32_t getIndex(uint16_t x, uint16_t y) {
      return (pixelSizeX * y + x) / valuesPerWord;
    }

    ALPAKA_FN_ACC ALPAKA_FN_INLINE constexpr uint32_t getShift(uint16_t x, uint16_t y) {
      return (x % valuesPerWord) * 2;
    }

    ALPAKA_FN_ACC ALPAKA_FN_INLINE constexpr Status getStatus(uint32_t const* __restrict__ status,
                                                              uint16_t x,
                                                              uint16_t y) {
      uint32_t index = getIndex(x, y);
      uint32_t shift = getShift(x, y);
      return Status{(status[index] >> shift) & mask};
    }

    ALPAKA_FN_ACC ALPAKA_FN_INLINE constexpr bool isDuplicate(uint32_t const* __restrict__ status,
                                                              uint16_t x,
                                                              uint16_t y) {
      return getStatus(status, x, y) == kDuplicate;
    }
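
    // Worked example (added comment, not in the original file): with Phase-1 modules of
    // 160 x 416 pixels and 2 bits per pixel, each 32-bit word holds valuesPerWord = 16
    // statuses, so a whole module fits in 160 * 416 / 16 = 4160 words. For pixel (x=5, y=1):
    //   getIndex(5, 1) = (160 * 1 + 5) / 16 = 10   -> word 10
    //   getShift(5, 1) = (5 % 16) * 2      = 10    -> bits [10:11] of that word
    // and getStatus() masks those two bits back into a Status value.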

    /* FIXME
     * In the more general case (e.g. a multithreaded CPU backend) there is a potential race condition
     * between the plain read of status[index] at the beginning of promote() and the atomicCas in its
     * compare-and-swap loop. We should investigate:
     * - if `status` should be read through a `volatile` pointer (CUDA/ROCm)
     * - if `status` should be read with an atomic load (CPU)
     */
    template <typename TAcc, typename = std::enable_if_t<alpaka::isAccelerator<TAcc>>>
    ALPAKA_FN_ACC ALPAKA_FN_INLINE constexpr void promote(TAcc const& acc,
                                                          uint32_t* __restrict__ status,
                                                          const uint16_t x,
                                                          const uint16_t y) {
      uint32_t index = getIndex(x, y);
      uint32_t shift = getShift(x, y);
      uint32_t old_word = status[index];
      uint32_t expected = old_word;
      do {
        expected = old_word;
        Status old_status{(old_word >> shift) & mask};
        if (kDuplicate == old_status) {
          // nothing to do
          return;
        }
        Status new_status = (kEmpty == old_status) ? kFound : kDuplicate;
        uint32_t new_word = old_word | (static_cast<uint32_t>(new_status) << shift);
        old_word = alpaka::atomicCas(acc, &status[index], expected, new_word, alpaka::hierarchy::Blocks{});
      } while (expected != old_word);
    }
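
    // Usage note (added comment, not in the original file): promote() implements a small
    // lock-free state machine per pixel; repeated calls on the same (x, y) move its status
    // along
    //   kEmpty -> kFound -> kDuplicate -> kDuplicate (no-op)
    // Because kFound (0x01) and kDuplicate (0x03) only ever OR bits into the word, a status
    // can only gain bits, and the compare-and-swap loop always terminates.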

  }  // namespace pixelStatus

  template <typename TrackerTraits>
  struct CountModules {
    template <typename TAcc>
    ALPAKA_FN_ACC void operator()(const TAcc& acc,
                                  SiPixelDigisSoAView digi_view,
                                  SiPixelClustersSoAView clus_view,
                                  const unsigned int numElements) const {
      // Make sure the atomicInc below does not overflow
      static_assert(TrackerTraits::numberOfModules < ::pixelClustering::maxNumModules);

#ifdef GPU_DEBUG
      if (cms::alpakatools::once_per_grid(acc)) {
        printf("Starting to count modules to set module starts:");
      }
#endif
      for (int32_t i : cms::alpakatools::uniform_elements(acc, numElements)) {
        digi_view[i].clus() = i;
        if (::pixelClustering::invalidModuleId == digi_view[i].moduleId())
          continue;

        int32_t j = i - 1;
        while (j >= 0 and digi_view[j].moduleId() == ::pixelClustering::invalidModuleId)
          --j;
        if (j < 0 or digi_view[j].moduleId() != digi_view[i].moduleId()) {
          // Found a module boundary: count the number of modules in clus_view[0].moduleStart()
          auto loc = alpaka::atomicInc(acc,
                                       &clus_view[0].moduleStart(),
                                       static_cast<uint32_t>(::pixelClustering::maxNumModules),
                                       alpaka::hierarchy::Blocks{});
#ifdef GPU_DEBUG
          printf("> New module (no. %d) found at digi %d \n", loc, i);
#endif
          clus_view[loc + 1].moduleStart() = i;
        }
      }
    }
  };
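
  // Example (added comment, not in the original file): for six digis with moduleIds
  // {5, 5, 7, 7, 7, 9}, the kernel finds module boundaries at digis 0, 2 and 5, so
  // after it runs
  //   clus_view[0].moduleStart() == 3                (number of modules found)
  //   {clus_view[1..3].moduleStart()} == {0, 2, 5}   (filled atomically, in any order)
  // and every digi starts out as its own cluster candidate, clus() == digi index.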

  template <typename TrackerTraits>
  struct FindClus {
    // assume that we can cover the whole module with up to 16 blockDimension-wide iterations
    static constexpr uint32_t maxIterGPU = 16;

    // this must be larger than maxPixInModule / maxIterGPU, and should be a multiple of the warp size
    static constexpr uint32_t maxElementsPerBlock =
        cms::alpakatools::round_up_by(TrackerTraits::maxPixInModule / maxIterGPU, 128);

    template <typename TAcc>
    ALPAKA_FN_ACC void operator()(const TAcc& acc,
                                  SiPixelDigisSoAView digi_view,
                                  SiPixelClustersSoAView clus_view,
                                  const unsigned int numElements) const {
      auto& lastPixel = alpaka::declareSharedVar<unsigned int, __COUNTER__>(acc);

      const uint32_t lastModule = clus_view[0].moduleStart();
      for (uint32_t module : cms::alpakatools::independent_groups(acc, lastModule)) {
        auto firstPixel = clus_view[1 + module].moduleStart();
        uint32_t thisModuleId = digi_view[firstPixel].moduleId();
        ALPAKA_ASSERT_ACC(thisModuleId < TrackerTraits::numberOfModules);

#ifdef GPU_DEBUG
        if (thisModuleId % 100 == 1)
          if (cms::alpakatools::once_per_block(acc))
            printf("start clusterizer for module %4d in block %4d\n",
                   thisModuleId,
                   alpaka::getIdx<alpaka::Grid, alpaka::Blocks>(acc)[0u]);
#endif

        // find the index of the first pixel not belonging to this module (or invalid)
        lastPixel = numElements;
        alpaka::syncBlockThreads(acc);

        // skip threads not associated to an existing pixel
        for (uint32_t i : cms::alpakatools::independent_group_elements(acc, firstPixel, numElements)) {
          auto id = digi_view[i].moduleId();
          // skip invalid pixels
          if (id == ::pixelClustering::invalidModuleId)
            continue;
          // find the first pixel in a different module
          if (id != thisModuleId) {
            alpaka::atomicMin(acc, &lastPixel, i, alpaka::hierarchy::Threads{});
            break;
          }
        }

        using Hist = cms::alpakatools::HistoContainer<uint16_t,
                                                      TrackerTraits::clusterBinning,
                                                      TrackerTraits::maxPixInModule,
                                                      TrackerTraits::clusterBits,
                                                      uint16_t>;
#if defined(__HIP_DEVICE_COMPILE__)
        constexpr auto warpSize = __AMDGCN_WAVEFRONT_SIZE;
#else
        constexpr auto warpSize = 32;
#endif
        auto& hist = alpaka::declareSharedVar<Hist, __COUNTER__>(acc);
        auto& ws = alpaka::declareSharedVar<typename Hist::Counter[warpSize], __COUNTER__>(acc);
        for (uint32_t j : cms::alpakatools::independent_group_elements(acc, Hist::totbins())) {
          hist.off[j] = 0;
        }
        alpaka::syncBlockThreads(acc);

        ALPAKA_ASSERT_ACC((lastPixel == numElements) or
                          ((lastPixel < numElements) and (digi_view[lastPixel].moduleId() != thisModuleId)));
        // limit the number of pixels to maxPixInModule (FIXME: if this turns out to be recurrent,
        // and not limited to simulation with low thresholds, a smarter approach will be needed)
        if (cms::alpakatools::once_per_block(acc)) {
          if (lastPixel - firstPixel > TrackerTraits::maxPixInModule) {
            printf("too many pixels in module %u: %u > %u\n",
                   thisModuleId,
                   lastPixel - firstPixel,
                   TrackerTraits::maxPixInModule);
            lastPixel = TrackerTraits::maxPixInModule + firstPixel;
          }
        }
        alpaka::syncBlockThreads(acc);
        ALPAKA_ASSERT_ACC(lastPixel - firstPixel <= TrackerTraits::maxPixInModule);

#ifdef GPU_DEBUG
        auto& totGood = alpaka::declareSharedVar<uint32_t, __COUNTER__>(acc);
        totGood = 0;
        alpaka::syncBlockThreads(acc);
#endif

        // remove duplicate pixels
        constexpr bool isPhase2 = std::is_base_of<pixelTopology::Phase2, TrackerTraits>::value;
        if constexpr (not isPhase2) {
          // packed words array used to store the pixelStatus of each pixel
          auto& status = alpaka::declareSharedVar<uint32_t[pixelStatus::size], __COUNTER__>(acc);

          if (lastPixel > 1) {
            for (uint32_t i : cms::alpakatools::independent_group_elements(acc, pixelStatus::size)) {
              status[i] = 0;
            }
            alpaka::syncBlockThreads(acc);

            for (uint32_t i : cms::alpakatools::independent_group_elements(acc, firstPixel, lastPixel - 1)) {
              // skip invalid pixels
              if (digi_view[i].moduleId() == ::pixelClustering::invalidModuleId)
                continue;
              pixelStatus::promote(acc, status, digi_view[i].xx(), digi_view[i].yy());
            }
            alpaka::syncBlockThreads(acc);

            for (uint32_t i : cms::alpakatools::independent_group_elements(acc, firstPixel, lastPixel - 1)) {
              // skip invalid pixels
              if (digi_view[i].moduleId() == ::pixelClustering::invalidModuleId)
                continue;
              if (pixelStatus::isDuplicate(status, digi_view[i].xx(), digi_view[i].yy())) {
                digi_view[i].moduleId() = ::pixelClustering::invalidModuleId;
                digi_view[i].rawIdArr() = 0;
              }
            }
            alpaka::syncBlockThreads(acc);
          }
        }
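
        // Note (added comment, not in the original file): after this step every (x, y)
        // position that fired more than once in this module has had all of its digis
        // invalidated, so each surviving digi corresponds to a unique pixel.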

        // fill histo
        for (uint32_t i : cms::alpakatools::independent_group_elements(acc, firstPixel, lastPixel)) {
          // skip invalid pixels
          if (digi_view[i].moduleId() != ::pixelClustering::invalidModuleId) {
            hist.count(acc, digi_view[i].yy());
#ifdef GPU_DEBUG
            alpaka::atomicAdd(acc, &totGood, 1u, alpaka::hierarchy::Blocks{});
#endif
          }
        }
        alpaka::syncBlockThreads(acc);  // FIXME this can be removed
        for (uint32_t i : cms::alpakatools::independent_group_elements(acc, warpSize)) {
          ws[i] = 0;  // used by the prefix scan in hist.finalize()
        }
        alpaka::syncBlockThreads(acc);
        hist.finalize(acc, ws);
        alpaka::syncBlockThreads(acc);
#ifdef GPU_DEBUG
        ALPAKA_ASSERT_ACC(hist.size() == totGood);
        if (thisModuleId % 100 == 1)
          if (cms::alpakatools::once_per_block(acc))
            printf("histo size %d\n", hist.size());
#endif
        for (uint32_t i : cms::alpakatools::independent_group_elements(acc, firstPixel, lastPixel)) {
          // skip invalid pixels
          if (digi_view[i].moduleId() != ::pixelClustering::invalidModuleId) {
            hist.fill(acc, digi_view[i].yy(), i - firstPixel);
          }
        }
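
        // Note (added comment, not in the original file): at this point hist maps each
        // pixel column (the y coordinate) to the indices of the pixels in that column,
        // so the neighbour search below only scans columns y and y+1 instead of the
        // whole module.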

#ifdef GPU_DEBUG
        // look for anomalous high occupancy
        auto& n40 = alpaka::declareSharedVar<uint32_t, __COUNTER__>(acc);
        auto& n60 = alpaka::declareSharedVar<uint32_t, __COUNTER__>(acc);
        if (cms::alpakatools::once_per_block(acc)) {
          n40 = 0;
          n60 = 0;
        }
        alpaka::syncBlockThreads(acc);
        for (uint32_t j : cms::alpakatools::independent_group_elements(acc, Hist::nbins())) {
          if (hist.size(j) > 60)
            alpaka::atomicAdd(acc, &n60, 1u, alpaka::hierarchy::Blocks{});
          if (hist.size(j) > 40)
            alpaka::atomicAdd(acc, &n40, 1u, alpaka::hierarchy::Blocks{});
        }
        alpaka::syncBlockThreads(acc);
        if (cms::alpakatools::once_per_block(acc)) {
          if (n60 > 0)
            printf("columns with more than 60 px %d in %d\n", n60, thisModuleId);
          else if (n40 > 0)
            printf("columns with more than 40 px %d in %d\n", n40, thisModuleId);
        }
        alpaka::syncBlockThreads(acc);
#endif

        [[maybe_unused]] const uint32_t blockDimension = alpaka::getWorkDiv<alpaka::Block, alpaka::Elems>(acc)[0u];
        // assume that we can cover the whole module with up to maxIterGPU blockDimension-wide iterations
        ALPAKA_ASSERT_ACC((hist.size() / blockDimension) < maxIterGPU);

        // number of elements per thread
        constexpr uint32_t maxElements =
            cms::alpakatools::requires_single_thread_per_block_v<TAcc> ? maxElementsPerBlock : 1;
        ALPAKA_ASSERT_ACC((alpaka::getWorkDiv<alpaka::Thread, alpaka::Elems>(acc)[0u] <= maxElements));

        constexpr unsigned int maxIter = maxIterGPU * maxElements;

        // nearest neighbours (nn)
        // allocate space for duplicate pixels: a pixel can appear more than once
        // with different charge in the same event
        constexpr int maxNeighbours = 10;
        uint16_t nn[maxIter][maxNeighbours];
        uint8_t nnn[maxIter];  // number of nn
        for (uint32_t k = 0; k < maxIter; ++k) {
          nnn[k] = 0;
        }

        alpaka::syncBlockThreads(acc);  // for hit filling!

        // fill the nearest neighbours
        uint32_t k = 0;
        for (uint32_t j : cms::alpakatools::independent_group_elements(acc, hist.size())) {
          ALPAKA_ASSERT_ACC(k < maxIter);
          auto p = hist.begin() + j;
          auto i = *p + firstPixel;
          ALPAKA_ASSERT_ACC(digi_view[i].moduleId() != ::pixelClustering::invalidModuleId);
          ALPAKA_ASSERT_ACC(digi_view[i].moduleId() == thisModuleId);  // same module
          auto bin = Hist::bin(digi_view[i].yy() + 1);
          auto end = hist.end(bin);
          ++p;
          ALPAKA_ASSERT_ACC(0 == nnn[k]);
          for (; p < end; ++p) {
            auto m = *p + firstPixel;
            ALPAKA_ASSERT_ACC(m != i);
            ALPAKA_ASSERT_ACC(int(digi_view[m].yy()) - int(digi_view[i].yy()) >= 0);
            ALPAKA_ASSERT_ACC(int(digi_view[m].yy()) - int(digi_view[i].yy()) <= 1);
            if (std::abs(int(digi_view[m].xx()) - int(digi_view[i].xx())) <= 1) {
              auto l = nnn[k]++;
              ALPAKA_ASSERT_ACC(l < maxNeighbours);
              nn[k][l] = *p;
            }
          }
          ++k;
        }
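
        // Note (added comment, not in the original file): each pair of adjacent pixels
        // is recorded only once, from the pixel with the lower column (or the lower
        // index within the same column); this is sufficient because the atomicMin
        // exchange below updates both ends of every recorded pair.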

        // for each pixel, look at all the pixels until the end of the module;
        // when two valid pixels within +/- 1 in x or y are found, set their id to the minimum;
        // after the loop, all the pixels in each cluster should have an id equal to that of
        // the lowest pixel in the cluster (clus[i] == i).
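        // Illustration (added, not in the original file): if three mutually adjacent
        // pixels start with clus = {4, 7, 9}, one pass of the atomicMin exchange lowers
        // them towards {4, 4, 4}, possibly leaving chains such as 9 -> 7 -> 4; the
        // pointer-jumping pass below (m = clus[m] until m == clus[m]) collapses the
        // chains, and the outer loop repeats until a full pass applies no change.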
        bool more = true;
        /*
        int nloops = 0;
        */
        while (alpaka::syncBlockThreadsPredicate<alpaka::BlockOr>(acc, more)) {
          /*
          if (nloops % 2 == 0) {
            // even iterations of the outer loop
          */
          more = false;
          uint32_t k = 0;
          for (uint32_t j : cms::alpakatools::independent_group_elements(acc, hist.size())) {
            ALPAKA_ASSERT_ACC(k < maxIter);
            auto p = hist.begin() + j;
            auto i = *p + firstPixel;
            for (int kk = 0; kk < nnn[k]; ++kk) {
              auto l = nn[k][kk];
              auto m = l + firstPixel;
              ALPAKA_ASSERT_ACC(m != i);
              // FIXME ::Threads ?
              auto old = alpaka::atomicMin(acc, &digi_view[m].clus(), digi_view[i].clus(), alpaka::hierarchy::Blocks{});
              if (old != digi_view[i].clus()) {
                // end the loop only if no changes were applied
                more = true;
              }
              // FIXME ::Threads ?
              alpaka::atomicMin(acc, &digi_view[i].clus(), old, alpaka::hierarchy::Blocks{});
            }  // neighbours loop
            ++k;
          }  // pixel loop
          /*
          // use the outer loop to force a synchronisation
          } else {
            // odd iterations of the outer loop
          */
          alpaka::syncBlockThreads(acc);
          for (uint32_t j : cms::alpakatools::independent_group_elements(acc, hist.size())) {
            auto p = hist.begin() + j;
            auto i = *p + firstPixel;
            auto m = digi_view[i].clus();
            while (m != digi_view[m].clus())
              m = digi_view[m].clus();
            digi_view[i].clus() = m;
          }
          /*
          }
          ++nloops;
          */
        }  // end while

        /*
        // check that all threads in the block have executed the same number of iterations
        auto& n0 = alpaka::declareSharedVar<int, __COUNTER__>(acc);
        if (cms::alpakatools::once_per_block(acc))
          n0 = nloops;
        alpaka::syncBlockThreads(acc);
        ALPAKA_ASSERT_ACC(alpaka::syncBlockThreadsPredicate<alpaka::BlockAnd>(acc, nloops == n0));
        if (thisModuleId % 100 == 1)
          if (cms::alpakatools::once_per_block(acc))
            printf("# loops %d\n", nloops);
        */

        auto& foundClusters = alpaka::declareSharedVar<unsigned int, __COUNTER__>(acc);
        foundClusters = 0;
        alpaka::syncBlockThreads(acc);

        // find the number of different clusters, identified by pixels with clus[i] == i;
        // mark these pixels with a negative id.
        for (uint32_t i : cms::alpakatools::independent_group_elements(acc, firstPixel, lastPixel)) {
          // skip invalid pixels
          if (digi_view[i].moduleId() == ::pixelClustering::invalidModuleId)
            continue;
          if (digi_view[i].clus() == static_cast<int>(i)) {
            auto old = alpaka::atomicInc(acc, &foundClusters, 0xffffffff, alpaka::hierarchy::Threads{});
            digi_view[i].clus() = -(old + 1);
          }
        }
        alpaka::syncBlockThreads(acc);

        // propagate the negative id to all the pixels in the cluster.
        for (uint32_t i : cms::alpakatools::independent_group_elements(acc, firstPixel, lastPixel)) {
          // skip invalid pixels
          if (digi_view[i].moduleId() == ::pixelClustering::invalidModuleId)
            continue;
          if (digi_view[i].clus() >= 0) {
            // mark each pixel in a cluster with the same id as the first one
            digi_view[i].clus() = digi_view[digi_view[i].clus()].clus();
          }
        }
        alpaka::syncBlockThreads(acc);

        // adjust the cluster id to be a positive value starting from 0
        for (uint32_t i : cms::alpakatools::independent_group_elements(acc, firstPixel, lastPixel)) {
          if (digi_view[i].moduleId() == ::pixelClustering::invalidModuleId) {
            // mark invalid pixels with an invalid cluster index
            digi_view[i].clus() = ::pixelClustering::invalidClusterId;
          } else {
            digi_view[i].clus() = -digi_view[i].clus() - 1;
          }
        }
        alpaka::syncBlockThreads(acc);
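
        // Example (added, not in the original file): suppose pixels 10, 11, 12 form one
        // cluster and pixel 13 its own, with clus = {10, 10, 10, 13} after the scan.
        // The counting pass turns this into {-1, 10, 10, -2} (the atomic order may differ),
        // the propagation pass into {-1, -1, -1, -2}, and the final adjustment into
        // {0, 0, 0, 1}: consecutive non-negative cluster ids within the module.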

        if (cms::alpakatools::once_per_block(acc)) {
          clus_view[thisModuleId].clusInModule() = foundClusters;
          clus_view[module].moduleId() = thisModuleId;
#ifdef GPU_DEBUG
          if (foundClusters > gMaxHit<TAcc>) {
            gMaxHit<TAcc> = foundClusters;
            if (foundClusters > 8)
              printf("max hit %d in %d\n", foundClusters, thisModuleId);
          }
          if (thisModuleId % 100 == 1)
            printf("%d clusters in module %d\n", foundClusters, thisModuleId);
#endif
        }
      }  // module loop
    }
  };

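  // Usage sketch (illustrative only; the launch values and view names here are
  // hypothetical, and the real launch code lives in the clusterizer plugin):
  //
  //   const auto workDiv = cms::alpakatools::make_workdiv<Acc1D>(blocks, threadsPerBlock);
  //   alpaka::exec<Acc1D>(queue, workDiv, CountModules<pixelTopology::Phase1>{}, digis.view(), clusters.view(), nDigis);
  //   alpaka::exec<Acc1D>(queue, workDiv, FindClus<pixelTopology::Phase1>{}, digis.view(), clusters.view(), nDigis);
  //
  // CountModules must run to completion before FindClus starts; enqueueing both on the
  // same queue provides that ordering.
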
}  // namespace ALPAKA_ACCELERATOR_NAMESPACE::pixelClustering

#endif  // RecoLocalTracker_SiPixelClusterizer_alpaka_PixelClustering_h