#include <thread_group_tensor_slice_transfer_global.hpp>
|
| __device__ | ThreadGroupTransferGlobal (const SrcDesc &src_desc, const DstDesc &dst_desc, const Index &src_block_slice_origin, const Index &dst_block_slice_origin, const ElementwiseOperation &element_op) |
| |
| template<typename GridBufferType > |
| __device__ void | RunRead (const SrcDesc &src_desc, const GridBufferType &grid_buf) |
| |
| template<typename BlockBufferType > |
| __device__ void | RunWrite (const DstDesc &dst_desc, BlockBufferType &dst_buf) |
| |
| __device__ void | MoveSrcSliceWindow (const SrcDesc &src_desc, const Index &step) |
| |
◆ DstCoord
template<typename SrcDesc , typename DstDesc , typename SrcData , typename DstData , typename ElementwiseOperation , typename NumberOfIterations , typename StepsPerIteration , typename IterationOrder , index_t VectorSize, bool DoTranspose>
| using ck::ThreadGroupTransferGlobal< SrcDesc, DstDesc, SrcData, DstData, ElementwiseOperation, NumberOfIterations, StepsPerIteration, IterationOrder, VectorSize, DoTranspose >::DstCoord = decltype(make_tensor_coordinate(DstDesc{}, Index{})) |
◆ Index
template<typename SrcDesc , typename DstDesc , typename SrcData , typename DstData , typename ElementwiseOperation , typename NumberOfIterations , typename StepsPerIteration , typename IterationOrder , index_t VectorSize, bool DoTranspose>
◆ SrcCoord
template<typename SrcDesc , typename DstDesc , typename SrcData , typename DstData , typename ElementwiseOperation , typename NumberOfIterations , typename StepsPerIteration , typename IterationOrder , index_t VectorSize, bool DoTranspose>
| using ck::ThreadGroupTransferGlobal< SrcDesc, DstDesc, SrcData, DstData, ElementwiseOperation, NumberOfIterations, StepsPerIteration, IterationOrder, VectorSize, DoTranspose >::SrcCoord = decltype(make_tensor_coordinate(SrcDesc{}, Index{})) |
◆ ThreadGroupTransferGlobal()
template<typename SrcDesc , typename DstDesc , typename SrcData , typename DstData , typename ElementwiseOperation , typename NumberOfIterations , typename StepsPerIteration , typename IterationOrder , index_t VectorSize, bool DoTranspose>
| __device__ ck::ThreadGroupTransferGlobal< SrcDesc, DstDesc, SrcData, DstData, ElementwiseOperation, NumberOfIterations, StepsPerIteration, IterationOrder, VectorSize, DoTranspose >::ThreadGroupTransferGlobal |
| (const SrcDesc &src_desc, const DstDesc &dst_desc, const Index &src_block_slice_origin, const Index &dst_block_slice_origin, const ElementwiseOperation &element_op) | inline |
◆ MoveSrcSliceWindow()
template<typename SrcDesc , typename DstDesc , typename SrcData , typename DstData , typename ElementwiseOperation , typename NumberOfIterations , typename StepsPerIteration , typename IterationOrder , index_t VectorSize, bool DoTranspose>
| __device__ void ck::ThreadGroupTransferGlobal< SrcDesc, DstDesc, SrcData, DstData, ElementwiseOperation, NumberOfIterations, StepsPerIteration, IterationOrder, VectorSize, DoTranspose >::MoveSrcSliceWindow |
| (const SrcDesc &src_desc, const Index &step) | inline |
◆ RunRead()
template<typename SrcDesc , typename DstDesc , typename SrcData , typename DstData , typename ElementwiseOperation , typename NumberOfIterations , typename StepsPerIteration , typename IterationOrder , index_t VectorSize, bool DoTranspose>
template<typename GridBufferType >
| __device__ void ck::ThreadGroupTransferGlobal< SrcDesc, DstDesc, SrcData, DstData, ElementwiseOperation, NumberOfIterations, StepsPerIteration, IterationOrder, VectorSize, DoTranspose >::RunRead |
| (const SrcDesc &src_desc, const GridBufferType &grid_buf) | inline |
◆ RunWrite()
template<typename SrcDesc , typename DstDesc , typename SrcData , typename DstData , typename ElementwiseOperation , typename NumberOfIterations , typename StepsPerIteration , typename IterationOrder , index_t VectorSize, bool DoTranspose>
template<typename BlockBufferType >
| __device__ void ck::ThreadGroupTransferGlobal< SrcDesc, DstDesc, SrcData, DstData, ElementwiseOperation, NumberOfIterations, StepsPerIteration, IterationOrder, VectorSize, DoTranspose >::RunWrite |
| (const DstDesc &dst_desc, BlockBufferType &dst_buf) | inline |
◆ I0
template<typename SrcDesc , typename DstDesc , typename SrcData , typename DstData , typename ElementwiseOperation , typename NumberOfIterations , typename StepsPerIteration , typename IterationOrder , index_t VectorSize, bool DoTranspose>
| constexpr auto ck::ThreadGroupTransferGlobal< SrcDesc, DstDesc, SrcData, DstData, ElementwiseOperation, NumberOfIterations, StepsPerIteration, IterationOrder, VectorSize, DoTranspose >::I0 = Number<0>{} |
|
static constexpr |
◆ I1
template<typename SrcDesc , typename DstDesc , typename SrcData , typename DstData , typename ElementwiseOperation , typename NumberOfIterations , typename StepsPerIteration , typename IterationOrder , index_t VectorSize, bool DoTranspose>
| constexpr auto ck::ThreadGroupTransferGlobal< SrcDesc, DstDesc, SrcData, DstData, ElementwiseOperation, NumberOfIterations, StepsPerIteration, IterationOrder, VectorSize, DoTranspose >::I1 = Number<1>{} |
|
static constexpr |
◆ I2
template<typename SrcDesc , typename DstDesc , typename SrcData , typename DstData , typename ElementwiseOperation , typename NumberOfIterations , typename StepsPerIteration , typename IterationOrder , index_t VectorSize, bool DoTranspose>
| constexpr auto ck::ThreadGroupTransferGlobal< SrcDesc, DstDesc, SrcData, DstData, ElementwiseOperation, NumberOfIterations, StepsPerIteration, IterationOrder, VectorSize, DoTranspose >::I2 = Number<2>{} |
|
static constexpr |
◆ I3
template<typename SrcDesc , typename DstDesc , typename SrcData , typename DstData , typename ElementwiseOperation , typename NumberOfIterations , typename StepsPerIteration , typename IterationOrder , index_t VectorSize, bool DoTranspose>
| constexpr auto ck::ThreadGroupTransferGlobal< SrcDesc, DstDesc, SrcData, DstData, ElementwiseOperation, NumberOfIterations, StepsPerIteration, IterationOrder, VectorSize, DoTranspose >::I3 = Number<3>{} |
|
static constexpr |
◆ I4
template<typename SrcDesc , typename DstDesc , typename SrcData , typename DstData , typename ElementwiseOperation , typename NumberOfIterations , typename StepsPerIteration , typename IterationOrder , index_t VectorSize, bool DoTranspose>
| constexpr auto ck::ThreadGroupTransferGlobal< SrcDesc, DstDesc, SrcData, DstData, ElementwiseOperation, NumberOfIterations, StepsPerIteration, IterationOrder, VectorSize, DoTranspose >::I4 = Number<4>{} |
|
static constexpr |
◆ I5
template<typename SrcDesc , typename DstDesc , typename SrcData , typename DstData , typename ElementwiseOperation , typename NumberOfIterations , typename StepsPerIteration , typename IterationOrder , index_t VectorSize, bool DoTranspose>
| constexpr auto ck::ThreadGroupTransferGlobal< SrcDesc, DstDesc, SrcData, DstData, ElementwiseOperation, NumberOfIterations, StepsPerIteration, IterationOrder, VectorSize, DoTranspose >::I5 = Number<5>{} |
|
static constexpr |
◆ I6
template<typename SrcDesc , typename DstDesc , typename SrcData , typename DstData , typename ElementwiseOperation , typename NumberOfIterations , typename StepsPerIteration , typename IterationOrder , index_t VectorSize, bool DoTranspose>
| constexpr auto ck::ThreadGroupTransferGlobal< SrcDesc, DstDesc, SrcData, DstData, ElementwiseOperation, NumberOfIterations, StepsPerIteration, IterationOrder, VectorSize, DoTranspose >::I6 = Number<6>{} |
|
static constexpr |
◆ nDim
template<typename SrcDesc , typename DstDesc , typename SrcData , typename DstData , typename ElementwiseOperation , typename NumberOfIterations , typename StepsPerIteration , typename IterationOrder , index_t VectorSize, bool DoTranspose>
The documentation for this struct was generated from the following file: