|
|
using | ConstViewType = typename ViewType::ConstViewType |
| | Type of constant segments view.
|
|
using | IndexAllocatorType = IndexAllocator |
|
using | OffsetsContainer = Containers::Vector< Index, Device, typename Base::IndexType, IndexAllocator > |
| template<typename Device_ = Device, typename Index_ = Index, typename IndexAllocator_ = typename Allocators::Default< Device_ >::template Allocator< Index_ >, ElementsOrganization Organization_ = Organization, int WarpSize_ = WarpSize> |
| using | Self = BiEllpack< Device_, Index_, IndexAllocator_, Organization_, WarpSize_ > |
| | Templated type for creating BiEllpack segments with different template parameters.
|
| template<typename Device_ = Device, typename Index_ = Index> |
| using | ViewTemplate = BiEllpackView< Device_, Index_, Organization, WarpSize > |
| | Templated view type.
|
|
using | ViewType = BiEllpackView< Device, Index, Organization, WarpSize > |
| | Type of segments view.
|
|
using | ConstOffsetsView |
| | The type for representing the constant vector view with offsets of the BiEllpack groups.
|
|
using | DeviceType |
| | The device where the segments are operating.
|
|
using | IndexType |
| | The type used for indexing of segments elements.
|
|
using | OffsetsView |
| | The type for representing the vector view with offsets of the BiEllpack groups.
|
|
using | SegmentViewType |
| | Accessor type for one particular segment.
|
|
|
| BiEllpack ()=default |
| | Constructor with no parameters to create empty segments.
|
|
| BiEllpack (BiEllpack &&segments) noexcept=default |
| | Move constructor.
|
|
| BiEllpack (const BiEllpack &segments) |
| | Copy constructor (makes deep copy).
|
| template<typename SizesContainer, std::enable_if_t< IsArrayType< SizesContainer >::value, bool > = true> |
| | BiEllpack (const SizesContainer &segmentsSizes) |
| | Constructor that initializes segments based on their sizes.
|
| template<typename ListIndex> |
| | BiEllpack (const std::initializer_list< ListIndex > &segmentsSizes) |
| | Constructor that initializes segments using an initializer list.
|
|
ConstViewType | getConstView () const |
| | Returns a constant view for this instance of segments which can be used, for example, in lambda functions running in GPU kernels.
|
|
ViewType | getView () |
| | Returns a view for this instance of segments which can be used, for example, in lambda functions running in GPU kernels.
|
|
template<typename SizesHolder> |
| void | initGroupPointers (const SizesHolder &segmentsSizes) |
| void | load (File &file) |
| | Method for loading the segments from a file in a binary form.
|
|
BiEllpack & | operator= (BiEllpack &&segments) noexcept(false) |
| | Move-assignment operator.
|
|
BiEllpack & | operator= (const BiEllpack &segments) |
| | Copy-assignment operator (makes a deep copy).
|
| template<typename Device_, typename Index_, typename IndexAllocator_, ElementsOrganization Organization_> |
| BiEllpack & | operator= (const BiEllpack< Device_, Index_, IndexAllocator_, Organization_, WarpSize > &segments) |
| | Assignment operator for segments with different template parameters.
|
|
void | reset () |
| | Resets the segments to the empty state (i.e., they contain no segments).
|
| void | save (File &file) const |
| | Method for saving the segments to a file in a binary form.
|
| template<typename SizesHolder> |
| void | setSegmentsSizes (const SizesHolder &sizes) |
| | Set sizes of particular segments.
|
|
__cuda_callable__ | BiEllpackBase ()=default |
| | Default constructor with no parameters to create empty segments view.
|
|
void | forAllElements (Function &&function) const |
|
void | forAllElementsIf (Condition condition, Function function) const |
|
void | forAllSegments (Function &&function) const |
|
void | forElements (IndexType begin, IndexType end, Function &&function) const |
|
void | forElementsIf (IndexType begin, IndexType end, Condition condition, Function function) const |
|
void | forSegments (IndexType begin, IndexType end, Function &&function) const |
|
__cuda_callable__ IndexType | getElementCount () const |
| | Returns the number of elements managed by all segments.
|
| __cuda_callable__ IndexType | getGlobalIndex (Index segmentIdx, Index localIdx) const |
| | Computes the global index of an element managed by the segments.
|
|
__cuda_callable__ OffsetsView | getGroupPointersView () |
| | Returns a view containing the pointers to the beginning of each segment.
|
|
__cuda_callable__ IndexType | getSegmentCount () const |
| | Returns the number of segments.
|
|
__cuda_callable__ IndexType | getSegmentsCount () const |
| | Returns the number of segments. Deprecated, use getSegmentCount().
|
|
__cuda_callable__ IndexType | getSegmentSize (IndexType segmentIdx) const |
| | Returns the size of a particular segment denoted by segmentIdx.
|
|
__cuda_callable__ OffsetsView | getSegmentsPermutationView () |
| | Returns a view containing the permutation of segments.
|
| __cuda_callable__ SegmentViewType | getSegmentView (IndexType segmentIdx) const |
| | Returns a segment view (i.e., a segment accessor) for the specified segment index.
|
|
__cuda_callable__ IndexType | getSize () const |
| | Returns the number of elements managed by all segments.
|
|
__cuda_callable__ IndexType | getStorageSize () const |
| | Returns the number of elements that need to be allocated by a container connected to these segments.
|
|
__cuda_callable__ IndexType | getVirtualSegments () const |
|
BiEllpackBase & | operator= (const BiEllpackBase &)=delete |
| | Copy-assignment operator.
|
|
void | printStructure (std::ostream &str) const |
| | Prints the structure of the segments to the specified output stream.
|
template<typename Device, typename Index, typename IndexAllocator = typename Allocators::Default< Device >::template Allocator< Index >,
ElementsOrganization Organization = DefaultElementsOrganization< Device >::getOrganization(), int WarpSize = Backend::getWarpSize()>
class TNL::Algorithms::Segments::BiEllpack< Device, Index, IndexAllocator, Organization, WarpSize >
Data structure for Bisection Ellpack segments.
Bisection Ellpack segments are inspired by the following paper:
[C. Zheng, S. Gu, T.-X. Gu, B. Yang, X.-P. Liu, BiELL: A bisection ELLPACK-based storage format for optimizing SpMV on GPUs, Journal of Parallel and Distributed Computing, Volume 74, Issue 7, 2014, pp. 2639-2647](https://www.sciencedirect.com/science/article/pii/S0743731514000458).
This format is designed to improve load balancing for segments with unevenly distributed sizes. It uses more meta-information compared to, for example, TNL::Algorithms::Segments::CSR, which can introduce overhead. However, it can be beneficial for reduction operations, particularly for longer segments with significant size variations.
See TNL::Algorithms::Segments for more details about segments.
- Template Parameters
-
| Device | The type of device on which the segments will operate. |
| Index | The type used for indexing elements managed by the segments. |
| IndexAllocator | The allocator used for managing index containers. |
| Organization | The organization of the elements in the segments—either row-major or column-major order. |
| WarpSize | The warp size used for the segments. |