/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/develop/include/ck/tensor_operation/gpu/grid/gridwise_gemm_xdl_cshuffle_v3_mx.hpp File Reference
gridwise_gemm_xdl_cshuffle_v3_mx.hpp File Reference
#include "ck/tensor_description/multi_index_transform_helper.hpp"
#include "ck/tensor_description/tensor_descriptor.hpp"
#include "ck/tensor_description/tensor_descriptor_helper.hpp"
#include "ck/tensor_operation/gpu/block/blockwise_gemm_pipeline_xdlops_mx_selector.hpp"
#include "ck/tensor_operation/gpu/block/thread_group_tensor_slice_transfer_v4r1.hpp"
#include "ck/tensor_operation/gpu/block/thread_group_tensor_slice_transfer_v6r1.hpp"
#include "ck/tensor_operation/gpu/element/element_wise_operation.hpp"
#include "ck/tensor_operation/gpu/grid/block_to_ctile_map.hpp"
#include "ck/tensor_operation/gpu/thread/threadwise_tensor_slice_transfer.hpp"
#include "ck/utility/common_header.hpp"
#include "ck/utility/env.hpp"
#include "ck/tensor_operation/gpu/block/thread_group_tensor_slice_transfer_direct_load.hpp"
Go to the source code of this file.
Namespaces
ck
Macros
#define KERNEL_GEMM_XDL_CSHUFFLE_V3_MX
Functions
template<bool Use2LDS, typename GridwiseGemm, bool HasMainKBlockLoop, InMemoryDataOperationEnum CGlobalMemoryDataOperation, index_t MinimumOccupancy = 1, TailNumber TailNum = TailNumber::Full>
__global__ enable_if_t<!Use2LDS, void> ck::kernel_gemm_xdl_cshuffle_v3_mx(typename GridwiseGemm::Argument karg)
template<bool Use2LDS, typename GridwiseGemm, bool HasMainKBlockLoop, InMemoryDataOperationEnum CGlobalMemoryDataOperation, index_t MinimumOccupancy = 1, TailNumber TailNum = TailNumber::Full>
__global__ enable_if_t<Use2LDS, void> ck::kernel_gemm_xdl_cshuffle_v3_mx(typename GridwiseGemm::Argument karg)
Macro Definition Documentation
◆ KERNEL_GEMM_XDL_CSHUFFLE_V3_MX
#define KERNEL_GEMM_XDL_CSHUFFLE_V3_MX