#include <block_reduce2d.hpp>
|
| CK_TILE_DEVICE constexpr | BlockReduce2d () |
| template<typename XDistributedTensor_, typename YDistributedTensor_, typename ReduceFunc, typename ReducePacksPerXDim = uniform_sequence_gen_t<2, 1>> |
| CK_TILE_DEVICE void | operator() (const XDistributedTensor_ &x_tensor, YDistributedTensor_ &y_tensor, const ReduceFunc &reduce_func, ReducePacksPerXDim={}) |
| template<typename XDistributedTensor_, typename YDistributedTensor_, typename YIndexDistributedTensor_, typename ReduceFunc, typename IndexCalculatorFunc, typename ReducePacksPerXDim = uniform_sequence_gen_t<2, 1>> |
| CK_TILE_DEVICE void | operator() (const XDistributedTensor_ &x_tensor, YDistributedTensor_ &y_tensor, YIndexDistributedTensor_ &y_index_tensor, const ReduceFunc &reduce_func, const IndexCalculatorFunc &index_calculator, ReducePacksPerXDim={}) |
| template<typename XDistributedTensor_, typename ReduceFunc, typename ReducePacksPerXDim = uniform_sequence_gen_t<2, 1>> |
| CK_TILE_DEVICE auto | operator() (const XDistributedTensor_ &x_tensor, const ComputeDataType &reduce_init, const ReduceFunc &reduce_func, ReducePacksPerXDim={}) |
◆ ComputeDataType
template<typename Problem_, typename Policy_ = void>
◆ Problem
template<typename Problem_, typename Policy_ = void>
◆ XDataType
template<typename Problem_, typename Policy_ = void>
◆ BlockReduce2d()
template<typename Problem_, typename Policy_ = void>
◆ MakeYBlockTile()
template<typename Problem_, typename Policy_ = void>
template<typename XDistributedTensor_>
◆ MakeYIndexBlockTile()
template<typename Problem_, typename Policy_ = void>
template<typename XDistributedTensor_, typename IndexDataType = index_t>
◆ operator()() [1/3]
template<typename Problem_, typename Policy_ = void>
template<typename XDistributedTensor_, typename ReduceFunc, typename ReducePacksPerXDim = uniform_sequence_gen_t<2, 1>>
◆ operator()() [2/3]
template<typename Problem_, typename Policy_ = void>
template<typename XDistributedTensor_, typename YDistributedTensor_, typename ReduceFunc, typename ReducePacksPerXDim = uniform_sequence_gen_t<2, 1>>
CK_TILE_DEVICE void ck_tile::BlockReduce2d< Problem_, Policy_ >::operator() (
    const XDistributedTensor_ & x_tensor,
    YDistributedTensor_ & y_tensor,
    const ReduceFunc & reduce_func,
    ReducePacksPerXDim = {} )
inline
◆ operator()() [3/3]
template<typename Problem_, typename Policy_ = void>
template<typename XDistributedTensor_, typename YDistributedTensor_, typename YIndexDistributedTensor_, typename ReduceFunc, typename IndexCalculatorFunc, typename ReducePacksPerXDim = uniform_sequence_gen_t<2, 1>>
CK_TILE_DEVICE void ck_tile::BlockReduce2d< Problem_, Policy_ >::operator() (
    const XDistributedTensor_ & x_tensor,
    YDistributedTensor_ & y_tensor,
    YIndexDistributedTensor_ & y_index_tensor,
    const ReduceFunc & reduce_func,
    const IndexCalculatorFunc & index_calculator,
    ReducePacksPerXDim = {} )
inline
The documentation for this struct was generated from the following file: