|
template<typename KeyIteratorT , typename ValueIteratorT , typename OffsetT , typename CompareOpT > |
DeviceMergeSort & | SortPairs (KeyIteratorT d_keys, ValueIteratorT d_items, OffsetT num_items, CompareOpT compare_op) |
|
template<typename KeyInputIteratorT , typename ValueInputIteratorT , typename KeyIteratorT , typename ValueIteratorT , typename OffsetT , typename CompareOpT > |
DeviceMergeSort & | SortPairsCopy (KeyInputIteratorT d_input_keys, ValueInputIteratorT d_input_items, KeyIteratorT d_output_keys, ValueIteratorT d_output_items, OffsetT num_items, CompareOpT compare_op) |
|
template<typename KeyIteratorT , typename OffsetT , typename CompareOpT > |
DeviceMergeSort & | SortKeys (KeyIteratorT d_keys, OffsetT num_items, CompareOpT compare_op) |
|
template<typename KeyInputIteratorT , typename KeyIteratorT , typename OffsetT , typename CompareOpT > |
DeviceMergeSort & | SortKeysCopy (KeyInputIteratorT d_input_keys, KeyIteratorT d_output_keys, OffsetT num_items, CompareOpT compare_op) |
|
template<typename KeyIteratorT , typename ValueIteratorT , typename OffsetT , typename CompareOpT > |
DeviceMergeSort & | StableSortPairs (KeyIteratorT d_keys, ValueIteratorT d_items, OffsetT num_items, CompareOpT compare_op) |
|
template<typename KeyIteratorT , typename OffsetT , typename CompareOpT > |
DeviceMergeSort & | StableSortKeys (KeyIteratorT d_keys, OffsetT num_items, CompareOpT compare_op) |
|
template<typename KeyIteratorT , typename ValueIteratorT , typename OffsetT , typename CompareOpT > |
DeviceMergeSort & | SortPairs (void *d_temp_storage, size_t &temp_storage_bytes, KeyIteratorT d_keys, ValueIteratorT d_items, OffsetT num_items, CompareOpT compare_op) |
|
template<typename KeyInputIteratorT , typename ValueInputIteratorT , typename KeyIteratorT , typename ValueIteratorT , typename OffsetT , typename CompareOpT > |
DeviceMergeSort & | SortPairsCopy (void *d_temp_storage, size_t &temp_storage_bytes, KeyInputIteratorT d_input_keys, ValueInputIteratorT d_input_items, KeyIteratorT d_output_keys, ValueIteratorT d_output_items, OffsetT num_items, CompareOpT compare_op) |
|
template<typename KeyIteratorT , typename OffsetT , typename CompareOpT > |
DeviceMergeSort & | SortKeys (void *d_temp_storage, size_t &temp_storage_bytes, KeyIteratorT d_keys, OffsetT num_items, CompareOpT compare_op) |
|
template<typename KeyInputIteratorT , typename KeyIteratorT , typename OffsetT , typename CompareOpT > |
DeviceMergeSort & | SortKeysCopy (void *d_temp_storage, size_t &temp_storage_bytes, KeyInputIteratorT d_input_keys, KeyIteratorT d_output_keys, OffsetT num_items, CompareOpT compare_op) |
|
template<typename KeyIteratorT , typename ValueIteratorT , typename OffsetT , typename CompareOpT > |
DeviceMergeSort & | StableSortPairs (void *d_temp_storage, size_t &temp_storage_bytes, KeyIteratorT d_keys, ValueIteratorT d_items, OffsetT num_items, CompareOpT compare_op) |
|
template<typename KeyIteratorT , typename OffsetT , typename CompareOpT > |
DeviceMergeSort & | StableSortKeys (void *d_temp_storage, size_t &temp_storage_bytes, KeyIteratorT d_keys, OffsetT num_items, CompareOpT compare_op) |
|
| CubWrapper (Stream &stream=Stream::Default()) |
|
void | kernel_name (std::string_view)=delete |
|
MUDA_GENERIC | LaunchBase (::cudaStream_t stream) MUDA_NOEXCEPT |
|
T & | push_range (const std::string &name) |
|
T & | pop_range () |
|
T & | kernel_name (std::string_view name) |
|
T & | file_line (std::string_view file, int line) |
|
T & | record (cudaEvent_t e, int flag=cudaEventRecordDefault) |
|
T & | record (ComputeGraphVar< cudaEvent_t > &e, const std::vector< ComputeGraphVarBase * > &vars) |
|
template<typename... ViewT> |
T & | record (ComputeGraphVar< cudaEvent_t > &e, ComputeGraphVar< ViewT > &... vars) |
|
T & | when (cudaEvent_t e, int flag=cudaEventWaitDefault) |
|
T & | wait (cudaEvent_t e, int flag=cudaEventWaitDefault) |
|
T & | wait (const ComputeGraphVar< cudaEvent_t > &e, const std::vector< ComputeGraphVarBase * > &vars) |
|
template<typename... ViewT> |
T & | wait (const ComputeGraphVar< cudaEvent_t > &e, ComputeGraphVar< ViewT > &... vars) |
|
T & | wait () |
|
T & | callback (const std::function< void(::cudaStream_t, ::cudaError)> &callback) |
|
template<typename Next > |
Next | next (Next n) |
|
template<typename Next , typename... Args> |
Next | next (Args &&... args) |
|
template<typename T > |
MUDA_GENERIC | LaunchBase (cudaStream_t stream) MUDA_NOEXCEPT |
|
MUDA_GENERIC | LaunchCore (::cudaStream_t stream) MUDA_NOEXCEPT |
|
void | init_stream (::cudaStream_t s) |
|
void | push_range (const std::string &name) |
|
void | pop_range () |
|
void | record (cudaEvent_t e, int flag=cudaEventRecordDefault) |
|
void | record (ComputeGraphVar< cudaEvent_t > &e, const std::vector< ComputeGraphVarBase * > &vars) |
|
template<typename... ViewT> |
void | record (ComputeGraphVar< cudaEvent_t > &e, ComputeGraphVar< ViewT > &... vars) |
|
void | when (cudaEvent_t e, int flag=cudaEventWaitDefault) |
|
void | wait (cudaEvent_t e, int flag=cudaEventWaitDefault) |
|
void | wait (const ComputeGraphVar< cudaEvent_t > &e, const std::vector< ComputeGraphVarBase * > &vars) |
|
template<typename... ViewT> |
void | wait (const ComputeGraphVar< cudaEvent_t > &e, ComputeGraphVar< ViewT > &... vars) |
|
void | wait () |
|
void | callback (const std::function< void(::cudaStream_t, ::cudaError)> &callback) |
|
template<typename... ViewT> |
MUDA_INLINE void | record (ComputeGraphVar< cudaEvent_t > &e, ComputeGraphVar< ViewT > &... vars) |
|
template<typename... ViewT> |
MUDA_INLINE void | wait (const ComputeGraphVar< cudaEvent_t > &e, ComputeGraphVar< ViewT > &... vars) |
|