#include <reduce2d_kernel.hpp>
template<typename InputShape , typename InputStrides , typename KeptDim , typename ReduceDims >
CK_TILE_DEVICE void operator() (const XDataType *p_x, YDataType *p_y, InputShape input_shape, InputStrides input_strides, KeptDim kept_dim, ReduceDims reduce_dims) const
◆ ComputeDataType
template<typename Problem_ , typename Policy_ = Reduce2dDefaultPolicy>
◆ Policy
template<typename Problem_ , typename Policy_ = Reduce2dDefaultPolicy>
◆ Problem
template<typename Problem_ , typename Policy_ = Reduce2dDefaultPolicy>
◆ XDataType
template<typename Problem_ , typename Policy_ = Reduce2dDefaultPolicy>
◆ YDataType
template<typename Problem_ , typename Policy_ = Reduce2dDefaultPolicy>
◆ BlockSize()
template<typename Problem_ , typename Policy_ = Reduce2dDefaultPolicy>
◆ IsSupportedArgument()
template<typename Problem_ , typename Policy_ = Reduce2dDefaultPolicy>
template<typename InputStrides >
Checks whether the given arguments are supported by the 2D reduction kernel.
- Parameters
-
y_continous_dim | Size of the continuous dimension of the output tensor. Must be a multiple of ThreadTile_N for proper thread mapping. |
input_strides | The stride configuration of the input tensor. The last stride must be 1 to ensure contiguous memory access and enable efficient vectorized loads. |
- Returns
- true if the arguments are supported, false otherwise. Error messages are logged when CK_TILE_LOGGING is enabled.
- Note
- Requirements:
- y_continous_dim % ThreadTile_N == 0 (for proper thread distribution)
- input_strides[-1] == 1, i.e. the last stride of the input tensor is 1 (for contiguous memory access)
◆ operator()()
template<typename Problem_ , typename Policy_ = Reduce2dDefaultPolicy>
template<typename InputShape , typename InputStrides , typename KeptDim , typename ReduceDims >
◆ kBlockSize
template<typename Problem_ , typename Policy_ = Reduce2dDefaultPolicy>
The documentation for this struct was generated from the following file:
- /home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/develop/include/ck_tile/ops/reduce/kernel/reduce2d_kernel.hpp