include/ck_tile/ops/epilogue/cshuffle_epilogue.hpp Source File
cshuffle_epilogue.hpp
Go to the documentation of this file.
Definition: cluster_descriptor.hpp:13
constexpr CK_TILE_HOST_DEVICE auto make_naive_tensor_descriptor(const tuple< Lengths... > &lengths, const tuple< Strides... > &strides, number< GuaranteedLastDimensionVectorLength >=number<-1 >{}, number< GuaranteedLastDimensionVectorStride >=number<-1 >{})
Definition: tensor_descriptor.hpp:255
typename impl::WarpGemmMfmaDispatcher< AType, BType, CType, MPerWave, NPerWave, KPerWave, TransposeC, SwizzleA >::Type WarpGemmMfmaDispatcher
Definition: warp_gemm_dispatcher.hpp:81
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition: type_traits.hpp:20
CK_TILE_DEVICE auto load_tile(const tile_window_with_static_distribution< BottomTensorView_, WindowLengths_, TileDistribution_, NumCoord > &tile_window, number< i_access >={}, bool_constant< oob_conditional_check >={})
Definition: load_tile.hpp:27
constexpr CK_TILE_HOST_DEVICE auto to_sequence(tuple< number< Is >... >)
Definition: sequence.hpp:1046
constexpr CK_TILE_HOST_DEVICE auto merge_sequences(Seqs...)
Definition: sequence.hpp:817
constexpr CK_TILE_DEVICE auto make_tile_window(null_tensor_view, const WindowLengths &window_lengths, const multi_index< WindowLengths::size()> &, Ts &&...)
Definition: null_tile_window.hpp:72
CK_TILE_DEVICE void move_tile_window(null_tile_window< WindowLengths > &, const typename null_tile_window< WindowLengths >::BottomTensorIndex &)
Definition: null_tile_window.hpp:92
constexpr CK_TILE_HOST_DEVICE auto make_tuple(Xs &&... xs)
Definition: tuple.hpp:337
CK_TILE_DEVICE void update_tile(tile_window_with_static_lengths< BottomTensorView_, WindowLengths_ > &tile_window_tmp, const static_distributed_tensor< DataType_, TileDistribution_ > &dstr_tensor)
Definition: update_tile.hpp:22
CK_TILE_DEVICE void store_tile(tile_window_with_static_lengths< BottomTensorView_, WindowLengths_ > &tile_window_tmp, const static_distributed_tensor< DataType_, TileDistribution_ > &dstr_tensor)
Definition: store_tile.hpp:23
typename uniform_sequence_gen< NSize, I >::type uniform_sequence_gen_t
Definition: sequence.hpp:1017
Definition: cshuffle_epilogue.hpp:42
static constexpr index_t kBlockSize
Definition: cshuffle_epilogue.hpp:47
static constexpr CK_TILE_HOST_DEVICE auto MakeLdsBlockDescriptor()
Definition: cshuffle_epilogue.hpp:88
typename WG::CWarpTensor CWarpTensor
Definition: cshuffle_epilogue.hpp:68
WarpGemmMfmaDispatcher< ODataType, ODataType, AccDataType, kMPerXdl, kNPerXdl, kKPerXdl, isCTransposed > WG
Definition: cshuffle_epilogue.hpp:65
static constexpr index_t kKPerXdl
Definition: cshuffle_epilogue.hpp:54
remove_cvref_t< Problem_ > Problem
Definition: cshuffle_epilogue.hpp:43
remove_cvref_t< typename Problem::ODataType > ODataType
Definition: cshuffle_epilogue.hpp:45
static constexpr index_t kNPerBlock
Definition: cshuffle_epilogue.hpp:49
static constexpr index_t kMPerIteration
Definition: cshuffle_epilogue.hpp:56
static constexpr index_t kMPerXdl
Definition: cshuffle_epilogue.hpp:52
remove_cvref_t< typename Problem::CLayout > CLayout
Definition: cshuffle_epilogue.hpp:46
static constexpr index_t isCTransposed
Definition: cshuffle_epilogue.hpp:55
static constexpr CK_TILE_HOST_DEVICE index_t GetSmemSize()
Definition: cshuffle_epilogue.hpp:110
static constexpr index_t kNWave
Definition: cshuffle_epilogue.hpp:51
static constexpr CK_TILE_HOST_DEVICE auto GetVectorSizeC()
Get the vector store size for the C tensor.
Definition: cshuffle_epilogue.hpp:81
remove_cvref_t< typename Problem::AccDataType > AccDataType
Definition: cshuffle_epilogue.hpp:44
static constexpr index_t kNPerIteration
Definition: cshuffle_epilogue.hpp:57
static constexpr index_t kMPerBlock
Definition: cshuffle_epilogue.hpp:48
typename WG::CWarpDstr CWarpDstr
Definition: cshuffle_epilogue.hpp:67
CK_TILE_DEVICE auto operator()(ODramWindow &out_dram_window, const OAccTile &o_acc_tile, void *p_smem)
Definition: cshuffle_epilogue.hpp:119
static constexpr index_t kMWave
Definition: cshuffle_epilogue.hpp:50
static constexpr index_t kNPerXdl
Definition: cshuffle_epilogue.hpp:53
Definition: cshuffle_epilogue.hpp:25
static constexpr index_t kNWave
Definition: cshuffle_epilogue.hpp:33
static constexpr index_t isCTransposed
Definition: cshuffle_epilogue.hpp:37
static constexpr index_t kMPerBlock
Definition: cshuffle_epilogue.hpp:30
static constexpr index_t kMPerXdl
Definition: cshuffle_epilogue.hpp:34
remove_cvref_t< CLayout_ > CLayout
Definition: cshuffle_epilogue.hpp:28
static constexpr index_t kNPerXdl
Definition: cshuffle_epilogue.hpp:35
remove_cvref_t< AccDataType_ > AccDataType
Definition: cshuffle_epilogue.hpp:26
static constexpr index_t kKPerXdl
Definition: cshuffle_epilogue.hpp:36
static constexpr index_t kBlockSize
Definition: cshuffle_epilogue.hpp:29
remove_cvref_t< ODataType_ > ODataType
Definition: cshuffle_epilogue.hpp:27
static constexpr index_t kMWave
Definition: cshuffle_epilogue.hpp:32
static constexpr index_t kNPerBlock
Definition: cshuffle_epilogue.hpp:31
Class creating a 2D static tile distribution with different load/store patterns.
Definition: static_encoding_pattern.hpp:61
Definition: integral_constant.hpp:13
Definition: sequence.hpp:52
Definition: space_filling_curve.hpp:20
Definition: functional.hpp:43