include/ck_tile/ops/grouped_convolution/utils/grouped_convolution_utils.hpp Source File
grouped_convolution_utils.hpp
Go to the documentation of this file.
Line 50: using GroupedConvFwdHostArgs = GroupedConvHostArgs<const void*, const void*, void*, CDElementwise>;
Definition: cluster_descriptor.hpp:13
ConvolutionSpecialization
Definition: convolution_specialization.hpp:11
ck_tile::element_wise::PassThrough PassThrough
Definition: grouped_convolution_utils.hpp:47
CK_TILE_HOST SplitImagePieceInfo calculate_spatial_piece(ck_tile::index_t piece_idx, ck_tile::index_t num_d_pieces, ck_tile::index_t num_h_pieces, ck_tile::index_t num_w_pieces, ck_tile::index_t base_piece_d, ck_tile::index_t base_piece_h, ck_tile::index_t base_piece_w, ck_tile::index_t total_d, ck_tile::index_t total_h, ck_tile::index_t total_w, ck_tile::index_t N, ck_tile::index_t K, ck_tile::index_t total_blocks)
Calculate piece information for split-image convolution.
Definition: grouped_convolution_utils.hpp:150
constexpr CK_TILE_HOST_DEVICE auto generate_tuple(F &&f, number< N >)
Definition: tuple.hpp:429
The Grouped Conv kernel host arguments.
Definition: grouped_convolution_utils.hpp:20
const std::vector< const void * > ds_ptr
Definition: grouped_convolution_utils.hpp:41
const CDElementwise elfunc
Definition: grouped_convolution_utils.hpp:44
CK_TILE_HOST GroupedConvHostArgs()=delete
CK_TILE_HOST GroupedConvHostArgs(ConvParam conv_param, InPtr in_ptr_, WeiPtr wei_ptr_, const std::vector< const void * > ds_ptr_, OutPtr out_ptr_, index_t k_batch_, CDElementwise elfunc_=CDElementwise{})
Definition: grouped_convolution_utils.hpp:22
Definition: grouped_convolution_utils.hpp:68
static constexpr index_t NumDTensor
Definition: grouped_convolution_utils.hpp:109
static constexpr ck_tile::index_t VectorSizeB
Definition: grouped_convolution_utils.hpp:107
OutLayout_ OutLayout
Definition: grouped_convolution_utils.hpp:83
static constexpr index_t NumGroupsToMerge
Definition: grouped_convolution_utils.hpp:77
static constexpr ck_tile::index_t VectorSizeC
Definition: grouped_convolution_utils.hpp:108
static constexpr ConvolutionSpecialization ConvSpecialization
Definition: grouped_convolution_utils.hpp:79
static constexpr index_t NDimSpatial
Definition: grouped_convolution_utils.hpp:78
decltype(generate_implicit_gemm_layout()) ImplicitGemmDsLayout
Definition: grouped_convolution_utils.hpp:110
WeiLayout_ WeiLayout
Definition: grouped_convolution_utils.hpp:81
static constexpr ck_tile::index_t VectorSizeA
Definition: grouped_convolution_utils.hpp:106
CDElementwise_ CDElementwise
Definition: grouped_convolution_utils.hpp:84
Helper struct for split-image piece information.
Definition: grouped_convolution_utils.hpp:119
ck_tile::index_t block_end
GPU block range for this piece.
Definition: grouped_convolution_utils.hpp:120
ck_tile::index_t d_size
Definition: grouped_convolution_utils.hpp:122
ck_tile::index_t d_start
Definition: grouped_convolution_utils.hpp:121
ck_tile::index_t w_start
Spatial start coordinates (output space).
Definition: grouped_convolution_utils.hpp:121
ck_tile::index_t h_size
Definition: grouped_convolution_utils.hpp:122
ck_tile::index_t h_start
Definition: grouped_convolution_utils.hpp:121
ck_tile::index_t w_size
Spatial dimensions of this piece.
Definition: grouped_convolution_utils.hpp:122
ck_tile::index_t block_start
Definition: grouped_convolution_utils.hpp:120
Definition: tile_gemm_traits.hpp:18
Definition: integral_constant.hpp:13
Definition: convolution_parameter.hpp:15
ConvParam(ck_tile::index_t n_dim, ck_tile::index_t group_count, ck_tile::index_t n_batch, ck_tile::index_t n_out_channels, ck_tile::index_t n_in_channels, const std::vector< ck_tile::index_t > &filters_len, const std::vector< ck_tile::index_t > &input_len, const std::vector< ck_tile::index_t > &strides, const std::vector< ck_tile::index_t > &dilations, const std::vector< ck_tile::index_t > &left_pads, const std::vector< ck_tile::index_t > &right_pads)
Definition: convolution_parameter.hpp:16
Definition: unary_element_wise_operation.hpp:437
Definition: tensor_layout.hpp:22
Definition: tensor_layout.hpp:17