d9/d97/workdivision_8h_source.html

 #ifndef HeterogeneousCore_AlpakaInterface_interface_workdivision_h
 #define HeterogeneousCore_AlpakaInterface_interface_workdivision_h

 #include <algorithm>
 #include <type_traits>

 #include <alpaka/alpaka.hpp>

 #include "HeterogeneousCore/AlpakaInterface/interface/config.h"
 #include "HeterogeneousCore/AlpakaInterface/interface/traits.h"
 #include "HeterogeneousCore/AlpakaInterface/interface/vec.h"

 namespace cms::alpakatools {

   // Make the names declared in namespace alpaka_common (such as Idx, Vec and WorkDiv) usable without
   // qualification inside cms::alpakatools; the declarations below rely on this.
   using namespace alpaka_common;

   // Round `value` up to the nearest multiple of `divisor`; a value that is already a multiple is returned as is.
   //
   // The result is computed from the remainder instead of `(value + divisor - 1) / divisor * divisor`, so the
   // intermediate sum cannot wrap around for values close to the maximum of Idx: the result is exact whenever
   // the rounded value itself is representable.
   // `divisor` must not be zero.
   inline constexpr Idx round_up_by(Idx value, Idx divisor) {
     return (value % divisor == 0) ? value : value + (divisor - value % divisor);
   }

   // Return `value / divisor` rounded up to the next integer.
   //
   // The quotient and the remainder are combined instead of evaluating `(value + divisor - 1) / divisor`, so
   // the computation cannot wrap around for values close to the maximum of Idx.
   // `divisor` must not be zero.
   inline constexpr Idx divide_up_by(Idx value, Idx divisor) {
     return value / divisor + ((value % divisor != 0) ? Idx{1} : Idx{0});
   }

   // Create an accelerator-dependent work division for 1-dimensional kernels.
   //
   //   - TAcc      the accelerator type; it must be 1-dimensional;
   //   - blocks    the number of blocks in the grid;
   //   - elements  the number of elements to be processed by each block.
   //
   // How "elements" is mapped to threads and elements per thread depends on the backend, see below.
   // Both GPU backends are guarded with #ifdef, so they are enabled by the mere definition of the
   // corresponding ALPAKA_ACC_GPU_*_ENABLED macro, whatever its value.
   template <typename TAcc,
             typename = std::enable_if_t<cms::alpakatools::is_accelerator_v<TAcc> and alpaka::Dim<TAcc>::value == 1>>
   inline WorkDiv<Dim1D> make_workdiv(Idx blocks, Idx elements) {
 #ifdef ALPAKA_ACC_GPU_CUDA_ENABLED
     if constexpr (std::is_same_v<TAcc, alpaka::AccGpuCudaRt<Dim1D, Idx>>) {
       // On GPU backends, each thread is looking at a single element:
       //   - the number of threads per block is "elements";
       //   - the number of elements per thread is always 1.
       return WorkDiv<Dim1D>(blocks, elements, Idx{1});
     } else
 #endif  // ALPAKA_ACC_GPU_CUDA_ENABLED
 #ifdef ALPAKA_ACC_GPU_HIP_ENABLED
         if constexpr (std::is_same_v<TAcc, alpaka::AccGpuHipRt<Dim1D, Idx>>) {
       // On GPU backends, each thread is looking at a single element:
       //   - the number of threads per block is "elements";
       //   - the number of elements per thread is always 1.
       return WorkDiv<Dim1D>(blocks, elements, Idx{1});
     } else
 #endif  // ALPAKA_ACC_GPU_HIP_ENABLED
     {
       // On CPU backends, run serially with a single thread per block:
       //   - the number of threads per block is always 1;
       //   - the number of elements per thread is "elements".
       return WorkDiv<Dim1D>(blocks, Idx{1}, elements);
     }
   }

   // Build the work division for an N-dimensional kernel running on the accelerator TAcc.
   //
   //   - blocks    the number of blocks in the grid, along each dimension;
   //   - elements  the number of elements to be processed by each block, along each dimension.
   template <typename TAcc, typename = std::enable_if_t<cms::alpakatools::is_accelerator_v<TAcc>>>
   inline WorkDiv<alpaka::Dim<TAcc>> make_workdiv(const Vec<alpaka::Dim<TAcc>>& blocks,
                                                  const Vec<alpaka::Dim<TAcc>>& elements) {
     using Dim = alpaka::Dim<TAcc>;

     // true if TAcc is one of the GPU backends enabled at compile time
     constexpr bool is_gpu_backend = false
 #ifdef ALPAKA_ACC_GPU_CUDA_ENABLED
                                     or std::is_same_v<TAcc, alpaka::AccGpuCudaRt<Dim, Idx>>
 #endif  // ALPAKA_ACC_GPU_CUDA_ENABLED
 #ifdef ALPAKA_ACC_GPU_HIP_ENABLED
                                     or std::is_same_v<TAcc, alpaka::AccGpuHipRt<Dim, Idx>>
 #endif  // ALPAKA_ACC_GPU_HIP_ENABLED
         ;

     if constexpr (is_gpu_backend) {
       // GPU backends: one element per thread, so "elements" gives the number of threads per block
       return WorkDiv<Dim>(blocks, elements, Vec<Dim>::ones());
     } else {
       // CPU backends: a single thread per block runs serially over "elements" elements
       return WorkDiv<Dim>(blocks, Vec<Dim>::ones(), elements);
     }
   }

   // Range over the 1-dimensional element indices assigned to the calling thread, meant to be used in a
   // range-based for loop inside a kernel:
   //
   //   for (Idx i : elements_with_stride<TAcc>(acc, size)) { ... }
   //
   // Each thread starts from a chunk of `elements_` consecutive indices at `first_`, then moves forward by
   // `stride_` (the number of indices covered by the whole grid in one pass) until it reaches `extent_`.
   template <typename TAcc,
             typename = std::enable_if_t<cms::alpakatools::is_accelerator_v<TAcc> and alpaka::Dim<TAcc>::value == 1>>
   class elements_with_stride {
   public:
     // Iterate over a single pass of the grid: the extent is set to the grid stride.
     ALPAKA_FN_ACC inline elements_with_stride(TAcc const& acc)
         : elements_{alpaka::getWorkDiv<alpaka::Thread, alpaka::Elems>(acc)[0u]},
           first_{alpaka::getIdx<alpaka::Grid, alpaka::Threads>(acc)[0u] * elements_},
           stride_{alpaka::getWorkDiv<alpaka::Grid, alpaka::Threads>(acc)[0u] * elements_},
           extent_{stride_} {}

     // Iterate over the indices in [0, extent).
     ALPAKA_FN_ACC inline elements_with_stride(TAcc const& acc, Idx extent)
         : elements_{alpaka::getWorkDiv<alpaka::Thread, alpaka::Elems>(acc)[0u]},
           first_{alpaka::getIdx<alpaka::Grid, alpaka::Threads>(acc)[0u] * elements_},
           stride_{alpaka::getWorkDiv<alpaka::Grid, alpaka::Threads>(acc)[0u] * elements_},
           extent_{extent} {}

     class iterator {
       friend class elements_with_stride;

       // `first` is clamped to `extent`, so that a thread starting past the end compares equal to end()
       ALPAKA_FN_ACC inline iterator(Idx elements, Idx stride, Idx extent, Idx first)
           : elements_{elements},
             stride_{stride},
             extent_{extent},
             first_{std::min(first, extent)},
             index_{first_},
             last_{std::min(first + elements, extent)} {}

     public:
       // the current element index
       ALPAKA_FN_ACC inline Idx operator*() const { return index_; }

       // pre-increment the iterator
       ALPAKA_FN_ACC inline iterator& operator++() {
         // increment the index along the elements processed by the current thread
         ++index_;
         if (index_ < last_)
           return *this;

         // move to the next chunk with the grid stride; stride_ is already expressed in elements
         // (threads in the grid times elements per thread), so it must not be scaled by elements_ again
         first_ += stride_;
         index_ = first_;
         last_ = std::min(first_ + elements_, extent_);
         if (index_ < extent_)
           return *this;

         // the iterator has reached or passed the end of the extent, clamp it to the extent
         first_ = extent_;
         index_ = extent_;
         last_ = extent_;
         return *this;
       }

       // post-increment the iterator
       ALPAKA_FN_ACC inline iterator operator++(int) {
         iterator old = *this;
         ++(*this);
         return old;
       }

       // two iterators are equal if they point to the same index of the same chunk
       ALPAKA_FN_ACC inline bool operator==(iterator const& other) const {
         return (index_ == other.index_) and (first_ == other.first_);
       }

       ALPAKA_FN_ACC inline bool operator!=(iterator const& other) const { return not(*this == other); }

     private:
       // non-const to support iterator copy and assignment
       Idx elements_;  // number of elements per thread
       Idx stride_;    // distance between two consecutive chunks of the same thread
       Idx extent_;    // one past the last valid index
       // modified by the pre/post-increment operator
       Idx first_;  // first index of the current chunk
       Idx index_;  // current index
       Idx last_;   // one past the last index of the current chunk, clamped to the extent
     };

     ALPAKA_FN_ACC inline iterator begin() const { return iterator(elements_, stride_, extent_, first_); }

     ALPAKA_FN_ACC inline iterator end() const { return iterator(elements_, stride_, extent_, extent_); }

   private:
     const Idx elements_;  // number of elements per thread
     const Idx first_;     // first index processed by the calling thread
     const Idx stride_;    // number of indices covered by the whole grid in one pass
     const Idx extent_;    // one past the last valid index
   };

   // Range over the N-dimensional element indices assigned to the calling thread, meant to be used in a
   // range-based for loop inside a kernel:
   //
   //   for (auto index : elements_with_stride_nd<TAcc>(acc, extent)) { ... }
   //
   // Each thread owns an N-dimensional chunk of `elements_` indices starting at `first_`. The iteration
   // visits every index of the chunk that lies within `extent_` (innermost dimension fastest), then moves
   // the chunk by `stride_` (the indices covered by the whole grid in one pass), again innermost dimension
   // first, until the extent is exhausted in every dimension.
   template <typename TAcc,
             typename = std::enable_if_t<cms::alpakatools::is_accelerator_v<TAcc> and (alpaka::Dim<TAcc>::value > 0)>>
   class elements_with_stride_nd {
   public:
     using Dim = alpaka::Dim<TAcc>;
     using Vec = alpaka::Vec<Dim, Idx>;

     // Iterate over a single pass of the grid: the extent is set to the grid stride.
     ALPAKA_FN_ACC inline elements_with_stride_nd(TAcc const& acc)
         : elements_{alpaka::getWorkDiv<alpaka::Thread, alpaka::Elems>(acc)},
           first_{alpaka::getIdx<alpaka::Grid, alpaka::Threads>(acc) * elements_},
           stride_{alpaka::getWorkDiv<alpaka::Grid, alpaka::Threads>(acc) * elements_},
           extent_{stride_} {}

     // Iterate over the indices that are smaller than `extent` in every dimension.
     ALPAKA_FN_ACC inline elements_with_stride_nd(TAcc const& acc, Vec extent)
         : elements_{alpaka::getWorkDiv<alpaka::Thread, alpaka::Elems>(acc)},
           first_{alpaka::getIdx<alpaka::Grid, alpaka::Threads>(acc) * elements_},
           stride_{alpaka::getWorkDiv<alpaka::Grid, alpaka::Threads>(acc) * elements_},
           extent_{extent} {}

     class iterator {
       friend class elements_with_stride_nd;
       constexpr static const auto last_dimension = Dim::value - 1;

       ALPAKA_FN_ACC inline iterator(Vec elements, Vec stride, Vec extent, Vec first)
           : elements_{elements},
             stride_{stride},
             extent_{extent},
             thread_{first},
             first_{first},
             index_{first},
             last_{std::min(first[last_dimension] + elements[last_dimension], extent[last_dimension])} {
         // If the starting point is outside of the extent along any dimension, every chunk of this thread
         // is outside of the extent as well: the range is empty and the iterator must compare equal to end().
         // Counting down with "dimension-- > 0" is correct for both signed and unsigned index types.
         for (auto dimension = Dim::value; dimension-- > 0;) {
           if (first[dimension] >= extent[dimension]) {
             thread_ = extent_;
             first_ = extent_;
             index_ = extent_;
             last_ = extent_[last_dimension];
             break;
           }
         }
       }

     public:
       // the current N-dimensional element index
       ALPAKA_FN_ACC inline Vec operator*() const { return index_; }

       // pre-increment the iterator
       ALPAKA_FN_ACC inline iterator& operator++() {
         // increment the index along the innermost dimension of the current chunk
         ++index_[last_dimension];
         if (index_[last_dimension] < last_)
           return *this;
         index_[last_dimension] = first_[last_dimension];

         // increment the index along the outer dimensions of the current chunk, rewinding each dimension
         // that has been exhausted
         for (auto dimension = last_dimension; dimension-- > 0;) {
           ++index_[dimension];
           if (index_[dimension] < std::min(first_[dimension] + elements_[dimension], extent_[dimension]))
             return *this;
           index_[dimension] = first_[dimension];
         }

         // the current chunk is exhausted: move to the next chunk with the grid stride, starting from the
         // innermost dimension; stride_ is already expressed in elements, so it is not scaled by elements_.
         // A dimension that runs past the extent is rewound to the thread's own starting point before
         // moving on to the next outer dimension.
         for (auto dimension = Dim::value; dimension-- > 0;) {
           first_[dimension] += stride_[dimension];
           if (first_[dimension] < extent_[dimension]) {
             index_ = first_;
             last_ = std::min(first_[last_dimension] + elements_[last_dimension], extent_[last_dimension]);
             return *this;
           }
           first_[dimension] = thread_[dimension];
         }

         // the iterator has reached or passed the end of the extent, clamp it to the extent
         first_ = extent_;
         index_ = extent_;
         last_ = extent_[last_dimension];
         return *this;
       }

       // post-increment the iterator
       ALPAKA_FN_ACC inline iterator operator++(int) {
         iterator old = *this;
         ++(*this);
         return old;
       }

       // two iterators are equal if they point to the same index of the same chunk
       ALPAKA_FN_ACC inline bool operator==(iterator const& other) const {
         return (index_ == other.index_) and (first_ == other.first_);
       }

       ALPAKA_FN_ACC inline bool operator!=(iterator const& other) const { return not(*this == other); }

     private:
       // non-const to support iterator copy and assignment
       Vec elements_;  // number of elements per thread, along each dimension
       Vec stride_;    // distance between two consecutive chunks of the same thread, along each dimension
       Vec extent_;    // one past the last valid index, along each dimension
       Vec thread_;    // starting point of the thread, used to rewind the inner dimensions
       // modified by the pre/post-increment operator
       Vec first_;  // first index of the current chunk
       Vec index_;  // current index
       Idx last_;   // one past the last index of the current chunk along the innermost dimension
     };

     ALPAKA_FN_ACC inline iterator begin() const { return iterator(elements_, stride_, extent_, first_); }

     ALPAKA_FN_ACC inline iterator end() const { return iterator(elements_, stride_, extent_, extent_); }

   private:
     const Vec elements_;  // number of elements per thread, along each dimension
     const Vec first_;     // first index processed by the calling thread
     const Vec stride_;    // number of indices covered by the whole grid in one pass, along each dimension
     const Vec extent_;    // one past the last valid index, along each dimension
   };

 }  // namespace cms::alpakatools

 #endif  // HeterogeneousCore_AlpakaInterface_interface_workdivision_h
first
auto first
Definition: CAHitNtupletGeneratorKernelsImpl.h:127

cms::alpakatools::elements_with_stride_nd::elements_with_stride_nd
ALPAKA_FN_ACC elements_with_stride_nd(TAcc const &acc, Vec extent)
Definition: workdivision.h:178

cms::alpakatools::elements_with_stride::iterator::index_
Idx index_
Definition: workdivision.h:150

cms::alpakatools::elements_with_stride::first_
const Idx first_
Definition: workdivision.h:160

cms::alpakatools::elements_with_stride::elements_with_stride
ALPAKA_FN_ACC elements_with_stride(TAcc const &acc)
Definition: workdivision.h:83

cms::alpakatools::elements_with_stride::iterator::last_
Idx last_
Definition: workdivision.h:151

cms::alpakatools::make_workdiv
WorkDiv< Dim1D > make_workdiv(Idx blocks, Idx elements)
Definition: workdivision.h:25

cms::alpakatools::divide_up_by
constexpr Idx divide_up_by(Idx value, Idx divisor)
Definition: workdivision.h:20

cms::alpakatools::elements_with_stride::elements_with_stride
ALPAKA_FN_ACC elements_with_stride(TAcc const &acc, Idx extent)
Definition: workdivision.h:89

cms::alpakatools::elements_with_stride::iterator::elements_
Idx elements_
Definition: workdivision.h:145

alpaka::elementwise_min
ALPAKA_NO_HOST_ACC_WARNING ALPAKA_FN_HOST_ACC constexpr auto elementwise_min(Vec< TDim, TVal > const &p, Vecs const &... qs) -> Vec< TDim, TVal >
Definition: vec.h:16

cms::alpakatools::elements_with_stride_nd::iterator::iterator
ALPAKA_FN_ACC iterator(Vec elements, Vec stride, Vec extent, Vec first)
Definition: workdivision.h:188

cms::alpakatools::elements_with_stride_nd::iterator
Definition: workdivision.h:184

alpaka_common::Idx
uint32_t Idx
Definition: config.h:13

cms::alpakatools::elements_with_stride_nd::iterator::last_
Idx last_
Definition: workdivision.h:250

cms::alpakatools::elements_with_stride_nd
Definition: workdivision.h:167

cms::alpakatools::elements_with_stride_nd::elements_
const Vec elements_
Definition: workdivision.h:258

cms::alpakatools::elements_with_stride::begin
ALPAKA_FN_ACC iterator begin() const
Definition: workdivision.h:154

cms::alpakatools::elements_with_stride::iterator::stride_
Idx stride_
Definition: workdivision.h:146

cms::alpakatools::elements_with_stride::iterator
Definition: workdivision.h:95

alpaka_common
Definition: config.h:10

cms::alpakatools::elements_with_stride_nd::iterator::operator*
ALPAKA_FN_ACC Vec operator*() const
Definition: workdivision.h:197

cms::alpakatools
Definition: Product.h:17

cms::alpakatools::elements_with_stride::iterator::first_
Idx first_
Definition: workdivision.h:149

cms::alpakatools::elements_with_stride::iterator::extent_
Idx extent_
Definition: workdivision.h:147

cms::alpakatools::elements_with_stride_nd::elements_with_stride_nd
ALPAKA_FN_ACC elements_with_stride_nd(TAcc const &acc)
Definition: workdivision.h:172

gather_cfg.blocks
blocks
Definition: gather_cfg.py:90

alpaka_common::WorkDiv
alpaka::WorkDivMembers< TDim, Idx > WorkDiv
Definition: config.h:30

cms::alpakatools::elements_with_stride_nd::iterator::elements_
Vec elements_
Definition: workdivision.h:244

cms::alpakatools::elements_with_stride::stride_
const Idx stride_
Definition: workdivision.h:161

cms::alpakatools::elements_with_stride::iterator::operator*
ALPAKA_FN_ACC Idx operator*() const
Definition: workdivision.h:107

cms::alpakatools::elements_with_stride_nd::iterator::operator++
ALPAKA_FN_ACC iterator operator++(int)
Definition: workdivision.h:230

trackingPlots.other
other
Definition: trackingPlots.py:1464

cms::alpakatools::elements_with_stride_nd::iterator::stride_
Vec stride_
Definition: workdivision.h:245

cms::alpakatools::elements_with_stride::end
ALPAKA_FN_ACC iterator end() const
Definition: workdivision.h:156

cms::alpakatools::round_up_by
constexpr Idx round_up_by(Idx value, Idx divisor)
Definition: workdivision.h:17

cms::alpakatools::elements_with_stride::iterator::iterator
ALPAKA_FN_ACC iterator(Idx elements, Idx stride, Idx extent, Idx first)
Definition: workdivision.h:98

SiStripPI::min
Definition: SiStripPayloadInspectorHelper.h:178

cms::alpakatools::elements_with_stride_nd::iterator::operator!=
ALPAKA_FN_ACC bool operator!=(iterator const &other) const
Definition: workdivision.h:240

cms::alpakatools::elements_with_stride::extent_
const Idx extent_
Definition: workdivision.h:162

value
Definition: value.py:1

cms::alpakatools::elements_with_stride_nd::end
ALPAKA_FN_ACC iterator end() const
Definition: workdivision.h:255

relativeConstraints.value
value
Definition: relativeConstraints.py:53

traits.h

cms::alpakatools::elements_with_stride_nd::Vec
alpaka::Vec< Dim, Idx > Vec
Definition: workdivision.h:170

cms::alpakatools::elements_with_stride::iterator::operator++
ALPAKA_FN_ACC iterator operator++(int)
Definition: workdivision.h:131

cms::alpakatools::elements_with_stride
Definition: workdivision.h:81

cms::alpakatools::elements_with_stride_nd::first_
const Vec first_
Definition: workdivision.h:259

cms::alpakatools::elements_with_stride_nd::iterator::extent_
Vec extent_
Definition: workdivision.h:246

alpaka_common::Vec
alpaka::Vec< TDim, Idx > Vec
Definition: config.h:23

cms::alpakatools::elements_with_stride_nd::extent_
const Vec extent_
Definition: workdivision.h:261

cms::alpakatools::elements_with_stride_nd::Dim
alpaka::Dim< TAcc > Dim
Definition: workdivision.h:169

cms::alpakatools::elements_with_stride_nd::iterator::operator==
ALPAKA_FN_ACC bool operator==(iterator const &other) const
Definition: workdivision.h:236

cms::alpakatools::elements_with_stride::iterator::operator==
ALPAKA_FN_ACC bool operator==(iterator const &other) const
Definition: workdivision.h:137

cms::alpakatools::elements_with_stride_nd::iterator::operator++
ALPAKA_FN_ACC iterator & operator++()
Definition: workdivision.h:200

cms::alpakatools::elements_with_stride_nd::begin
ALPAKA_FN_ACC iterator begin() const
Definition: workdivision.h:253

cms::alpakatools::elements_with_stride_nd::iterator::first_
Vec first_
Definition: workdivision.h:248

cms::alpakatools::elements_with_stride_nd::stride_
const Vec stride_
Definition: workdivision.h:260

cms::alpakatools::elements_with_stride::iterator::operator++
ALPAKA_FN_ACC iterator & operator++()
Definition: workdivision.h:110

config.h

gpuPixelDoublets::stride
auto stride
Definition: gpuPixelDoubletsAlgos.h:80

pat::helper::ParametrizationHelper::dimension
uint32_t dimension(pat::CandKinResolution::Parametrization parametrization)
Returns the number of free parameters in a parametrization (3 or 4)
Definition: ParametrizationHelper.h:12

cms::alpakatools::elements_with_stride_nd::iterator::index_
Vec index_
Definition: workdivision.h:249

bookConverter.elements
elements
Definition: bookConverter.py:147

cms::alpakatools::elements_with_stride::iterator::operator!=
ALPAKA_FN_ACC bool operator!=(iterator const &other) const
Definition: workdivision.h:141

vec.h

cms::alpakatools::elements_with_stride::elements_
const Idx elements_
Definition: workdivision.h:159