Class muda::DeviceSegmentedReduce
ClassList > muda > DeviceSegmentedReduce
Inherits the following classes: muda::CubWrapper
Public Types inherited from muda::LaunchBase
See muda::LaunchBase
| Type | Name |
|---|---|
| typedef T | derived_type |
Public Attributes inherited from muda::CubWrapper
See muda::CubWrapper
| Type | Name |
|---|---|
| Stream * | m_muda_stream = = nullptr |
Public Functions
| Type | Name |
|---|---|
| DeviceSegmentedReduce & | ArgMax (InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
| DeviceSegmentedReduce & | ArgMax (void * d_temp_storage, size_t & temp_storage_bytes, InputIteratorT d_in, OutputIteratorT d_out, int num_items) |
| DeviceSegmentedReduce & | ArgMax (void * d_temp_storage, size_t & temp_storage_bytes, InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
| DeviceSegmentedReduce & | ArgMin (InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
| DeviceSegmentedReduce & | ArgMin (void * d_temp_storage, size_t & temp_storage_bytes, InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
| DeviceSegmentedReduce & | Max (InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
| DeviceSegmentedReduce & | Max (void * d_temp_storage, size_t & temp_storage_bytes, InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
| DeviceSegmentedReduce & | Min (InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
| DeviceSegmentedReduce & | Min (void * d_temp_storage, size_t & temp_storage_bytes, InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
| DeviceSegmentedReduce & | Reduce (InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets, ReductionOp reduction_op, T initial_value) |
| DeviceSegmentedReduce & | Reduce (void * d_temp_storage, size_t & temp_storage_bytes, InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets, ReductionOp reduction_op, T initial_value) |
| DeviceSegmentedReduce & | Sum (InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
| DeviceSegmentedReduce & | Sum (void * d_temp_storage, size_t & temp_storage_bytes, InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
Public Functions inherited from muda::CubWrapper
See muda::CubWrapper
| Type | Name |
|---|---|
| CubWrapper (Stream & stream=Stream::Default()) |
|
| void | kernel_name (std::string_view) = delete |
Public Functions inherited from muda::LaunchBase
See muda::LaunchBase
| Type | Name |
|---|---|
| MUDA_GENERIC | LaunchBase (::cudaStream_t stream) |
| T & | callback (const std::function< void(::cudaStream_t, ::cudaError)> & callback) |
| T & | file_line (std::string_view file, int line) |
| T & | kernel_name (std::string_view name) |
| Next | next (Next n) |
| Next | next (Args &&... args) |
| T & | pop_range () |
| T & | push_range (const std::string & name) |
| T & | record (cudaEvent_t e, int flag=cudaEventRecordDefault) |
| T & | record (ComputeGraphVar< cudaEvent_t > & e, const std::vector< ComputeGraphVarBase * > & vars) |
| T & | record (ComputeGraphVar< cudaEvent_t > & e, ComputeGraphVar< ViewT > &... vars) |
| T & | wait (cudaEvent_t e, int flag=cudaEventWaitDefault) |
| T & | wait (const ComputeGraphVar< cudaEvent_t > & e, const std::vector< ComputeGraphVarBase * > & vars) |
| T & | wait (const ComputeGraphVar< cudaEvent_t > & e, ComputeGraphVar< ViewT > &... vars) |
| T & | wait () |
| T & | when (cudaEvent_t e, int flag=cudaEventWaitDefault) |
| ~LaunchBase () |
Public Functions inherited from muda::LaunchCore
See muda::LaunchCore
| Type | Name |
|---|---|
| MUDA_GENERIC | LaunchCore (::cudaStream_t stream) |
| void | callback (const std::function< void(::cudaStream_t, ::cudaError)> & callback) |
| void | init_stream (::cudaStream_t s) |
| void | pop_range () |
| void | push_range (const std::string & name) |
| void | record (cudaEvent_t e, int flag=cudaEventRecordDefault) |
| void | record (ComputeGraphVar< cudaEvent_t > & e, const std::vector< ComputeGraphVarBase * > & vars) |
| void | record (ComputeGraphVar< cudaEvent_t > & e, ComputeGraphVar< ViewT > &... vars) |
| void | wait (cudaEvent_t e, int flag=cudaEventWaitDefault) |
| void | wait (const ComputeGraphVar< cudaEvent_t > & e, const std::vector< ComputeGraphVarBase * > & vars) |
| void | wait (const ComputeGraphVar< cudaEvent_t > & e, ComputeGraphVar< ViewT > &... vars) |
| void | wait () |
| void | when (cudaEvent_t e, int flag=cudaEventWaitDefault) |
| ~LaunchCore () |
Public Static Functions inherited from muda::LaunchCore
See muda::LaunchCore
| Type | Name |
|---|---|
| void | file_line (std::string_view file, int line) |
| void | kernel_name (std::string_view name) |
| void | wait_device () |
| void | wait_event (cudaEvent_t event) |
| void | wait_stream (::cudaStream_t stream) |
Protected Types inherited from muda::LaunchCore
See muda::LaunchCore
| Type | Name |
|---|---|
| typedef std::shared_ptr< T > | S |
Protected Attributes inherited from muda::LaunchCore
See muda::LaunchCore
| Type | Name |
|---|---|
| ::cudaStream_t | m_stream |
Protected Functions inherited from muda::CubWrapper
See muda::CubWrapper
| Type | Name |
|---|---|
| std::byte * | prepare_buffer (size_t reqSize) |
Protected Functions inherited from muda::LaunchBase
See muda::LaunchBase
| Type | Name |
|---|---|
| T & | pop_kernel_label () |
Protected Functions inherited from muda::LaunchCore
See muda::LaunchCore
| Type | Name |
|---|---|
| MUDA_HOST void | pop_kernel_label () |
| MUDA_GENERIC::cudaStream_t | stream () const |
Public Functions Documentation
function ArgMax [1/3]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::ArgMax (
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function ArgMax [2/3]
template<typename InputIteratorT, typename OutputIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::ArgMax (
void * d_temp_storage,
size_t & temp_storage_bytes,
InputIteratorT d_in,
OutputIteratorT d_out,
int num_items
)
function ArgMax [3/3]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::ArgMax (
void * d_temp_storage,
size_t & temp_storage_bytes,
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function ArgMin [1/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::ArgMin (
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function ArgMin [2/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::ArgMin (
void * d_temp_storage,
size_t & temp_storage_bytes,
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function Max [1/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Max (
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function Max [2/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Max (
void * d_temp_storage,
size_t & temp_storage_bytes,
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function Min [1/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Min (
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function Min [2/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Min (
void * d_temp_storage,
size_t & temp_storage_bytes,
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function Reduce [1/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT, typename ReductionOp, typename T>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Reduce (
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets,
ReductionOp reduction_op,
T initial_value
)
function Reduce [2/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT, typename ReductionOp, typename T>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Reduce (
void * d_temp_storage,
size_t & temp_storage_bytes,
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets,
ReductionOp reduction_op,
T initial_value
)
function Sum [1/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Sum (
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function Sum [2/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Sum (
void * d_temp_storage,
size_t & temp_storage_bytes,
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
The documentation for this class was generated from the following file src/muda/cub/device/device_segmented_reduce.h