Class muda::DeviceSegmentedReduce
ClassList > muda > DeviceSegmentedReduce
Inherits the following classes: muda::CubWrapper
Public Types inherited from muda::LaunchBase
See muda::LaunchBase
Type | Name |
---|---|
typedef T | derived_type |
Public Attributes inherited from muda::CubWrapper
See muda::CubWrapper
Type | Name |
---|---|
Stream * | m_muda_stream = nullptr |
Public Functions
Type | Name |
---|---|
DeviceSegmentedReduce & | ArgMax (InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
DeviceSegmentedReduce & | ArgMax (void * d_temp_storage, size_t & temp_storage_bytes, InputIteratorT d_in, OutputIteratorT d_out, int num_items) |
DeviceSegmentedReduce & | ArgMax (void * d_temp_storage, size_t & temp_storage_bytes, InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
DeviceSegmentedReduce & | ArgMin (InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
DeviceSegmentedReduce & | ArgMin (void * d_temp_storage, size_t & temp_storage_bytes, InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
DeviceSegmentedReduce & | Max (InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
DeviceSegmentedReduce & | Max (void * d_temp_storage, size_t & temp_storage_bytes, InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
DeviceSegmentedReduce & | Min (InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
DeviceSegmentedReduce & | Min (void * d_temp_storage, size_t & temp_storage_bytes, InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
DeviceSegmentedReduce & | Reduce (InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets, ReductionOp reduction_op, T initial_value) |
DeviceSegmentedReduce & | Reduce (void * d_temp_storage, size_t & temp_storage_bytes, InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets, ReductionOp reduction_op, T initial_value) |
DeviceSegmentedReduce & | Sum (InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
DeviceSegmentedReduce & | Sum (void * d_temp_storage, size_t & temp_storage_bytes, InputIteratorT d_in, OutputIteratorT d_out, int num_segments, BeginOffsetIteratorT d_begin_offsets, EndOffsetIteratorT d_end_offsets) |
Public Functions inherited from muda::CubWrapper
See muda::CubWrapper
Type | Name |
---|---|
CubWrapper (Stream & stream=Stream::Default()) |
void | kernel_name (std::string_view) = delete |
Public Functions inherited from muda::LaunchBase
See muda::LaunchBase
Type | Name |
---|---|
MUDA_GENERIC | LaunchBase (::cudaStream_t stream) |
T & | callback (const std::function< void(::cudaStream_t, ::cudaError)> & callback) |
T & | file_line (std::string_view file, int line) |
T & | kernel_name (std::string_view name) |
Next | next (Next n) |
Next | next (Args &&... args) |
T & | pop_range () |
T & | push_range (const std::string & name) |
T & | record (cudaEvent_t e, int flag=cudaEventRecordDefault) |
T & | record (ComputeGraphVar< cudaEvent_t > & e, const std::vector< ComputeGraphVarBase * > & vars) |
T & | record (ComputeGraphVar< cudaEvent_t > & e, ComputeGraphVar< ViewT > &... vars) |
T & | wait (cudaEvent_t e, int flag=cudaEventWaitDefault) |
T & | wait (const ComputeGraphVar< cudaEvent_t > & e, const std::vector< ComputeGraphVarBase * > & vars) |
T & | wait (const ComputeGraphVar< cudaEvent_t > & e, ComputeGraphVar< ViewT > &... vars) |
T & | wait () |
T & | when (cudaEvent_t e, int flag=cudaEventWaitDefault) |
~LaunchBase () |
Public Functions inherited from muda::LaunchCore
See muda::LaunchCore
Type | Name |
---|---|
MUDA_GENERIC | LaunchCore (::cudaStream_t stream) |
void | callback (const std::function< void(::cudaStream_t, ::cudaError)> & callback) |
void | init_stream (::cudaStream_t s) |
void | pop_range () |
void | push_range (const std::string & name) |
void | record (cudaEvent_t e, int flag=cudaEventRecordDefault) |
void | record (ComputeGraphVar< cudaEvent_t > & e, const std::vector< ComputeGraphVarBase * > & vars) |
void | record (ComputeGraphVar< cudaEvent_t > & e, ComputeGraphVar< ViewT > &... vars) |
void | wait (cudaEvent_t e, int flag=cudaEventWaitDefault) |
void | wait (const ComputeGraphVar< cudaEvent_t > & e, const std::vector< ComputeGraphVarBase * > & vars) |
void | wait (const ComputeGraphVar< cudaEvent_t > & e, ComputeGraphVar< ViewT > &... vars) |
void | wait () |
void | when (cudaEvent_t e, int flag=cudaEventWaitDefault) |
~LaunchCore () |
Public Static Functions inherited from muda::LaunchCore
See muda::LaunchCore
Type | Name |
---|---|
void | file_line (std::string_view file, int line) |
void | kernel_name (std::string_view name) |
void | wait_device () |
void | wait_event (cudaEvent_t event) |
void | wait_stream (::cudaStream_t stream) |
Protected Types inherited from muda::LaunchCore
See muda::LaunchCore
Type | Name |
---|---|
typedef std::shared_ptr< T > | S |
Protected Attributes inherited from muda::LaunchCore
See muda::LaunchCore
Type | Name |
---|---|
::cudaStream_t | m_stream |
Protected Functions inherited from muda::CubWrapper
See muda::CubWrapper
Type | Name |
---|---|
std::byte * | prepare_buffer (size_t reqSize) |
Protected Functions inherited from muda::LaunchBase
See muda::LaunchBase
Type | Name |
---|---|
T & | pop_kernel_label () |
Protected Functions inherited from muda::LaunchCore
See muda::LaunchCore
Type | Name |
---|---|
MUDA_HOST void | pop_kernel_label () |
MUDA_GENERIC ::cudaStream_t | stream () const |
Public Functions Documentation
function ArgMax [1/3]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::ArgMax (
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function ArgMax [2/3]
template<typename InputIteratorT, typename OutputIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::ArgMax (
void * d_temp_storage,
size_t & temp_storage_bytes,
InputIteratorT d_in,
OutputIteratorT d_out,
int num_items
)
function ArgMax [3/3]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::ArgMax (
void * d_temp_storage,
size_t & temp_storage_bytes,
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function ArgMin [1/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::ArgMin (
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function ArgMin [2/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::ArgMin (
void * d_temp_storage,
size_t & temp_storage_bytes,
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function Max [1/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Max (
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function Max [2/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Max (
void * d_temp_storage,
size_t & temp_storage_bytes,
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function Min [1/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Min (
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function Min [2/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Min (
void * d_temp_storage,
size_t & temp_storage_bytes,
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function Reduce [1/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT, typename ReductionOp, typename T>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Reduce (
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets,
ReductionOp reduction_op,
T initial_value
)
function Reduce [2/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT, typename ReductionOp, typename T>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Reduce (
void * d_temp_storage,
size_t & temp_storage_bytes,
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets,
ReductionOp reduction_op,
T initial_value
)
function Sum [1/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Sum (
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
function Sum [2/2]
template<typename InputIteratorT, typename OutputIteratorT, typename BeginOffsetIteratorT, typename EndOffsetIteratorT>
inline DeviceSegmentedReduce & muda::DeviceSegmentedReduce::Sum (
void * d_temp_storage,
size_t & temp_storage_bytes,
InputIteratorT d_in,
OutputIteratorT d_out,
int num_segments,
BeginOffsetIteratorT d_begin_offsets,
EndOffsetIteratorT d_end_offsets
)
The documentation for this class was generated from the following file: src/muda/cub/device/device_segmented_reduce.h