/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/develop/include/ck_tile/ops/epilogue/dynamic_quant_epilogue.hpp Source File
dynamic_quant_epilogue.hpp
Go to the documentation of this file.
Definition: cluster_descriptor.hpp:13
CK_TILE_DEVICE auto tile_elementwise_in(const InElementFunc &in_element_func, const InTensor &... in_dstr_tensors)
Definition: tile_elementwise.hpp:40
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition: type_traits.hpp:21
CK_TILE_DEVICE void buffer_store_fence(index_t cnt=0)
Definition: amd_buffer_addressing.hpp:1000
CK_TILE_DEVICE void store_tile_raw(tile_window_with_static_lengths< BottomTensorView_, WindowLengths_ > &tile_window_tmp, const static_distributed_tensor< DataType_, TileDistribution_ > &dstr_tensor)
Definition: store_tile.hpp:46
constexpr CK_TILE_DEVICE auto make_tile_window(null_tensor_view, const WindowLengths &window_lengths, const multi_index< WindowLengths::size()> &, Ts &&...)
Definition: null_tile_window.hpp:75
constexpr CK_TILE_HOST_DEVICE auto make_tuple(Xs &&... xs)
Definition: tuple.hpp:360
CK_TILE_DEVICE void store_tile(tile_window_with_static_lengths< BottomTensorView_, WindowLengths_ > &tile_window_tmp, const static_distributed_tensor< DataType_, TileDistribution_ > &dstr_tensor)
Definition: store_tile.hpp:23
CK_TILE_DEVICE auto load_tile(const TileWindow_ &tile_window, number< i_access >={}, bool_constant< oob_conditional_check >={})
Definition: load_tile.hpp:22
constexpr CK_TILE_HOST_DEVICE void sweep_tile(const F &f, UnpacksPerXDim={})
Definition: sweep_tile.hpp:231
constexpr CK_TILE_HOST_DEVICE auto make_static_tile_distribution(StaticTileDistributionEncoding_)
Definition: tile_distribution.hpp:480
Definition: block_reduce2d.hpp:200
Definition: block_reduce2d.hpp:45
Definition: block_reduce2d_problem.hpp:12
Definition: block_reduce2d.hpp:135
Definition: dynamic_quant_epilogue.hpp:45
static constexpr bool UseMax3
Definition: dynamic_quant_epilogue.hpp:55
remove_cvref_t< typename Problem::BlockShape > BlockShape
Definition: dynamic_quant_epilogue.hpp:51
remove_cvref_t< typename Problem::YScaleDataType > YScaleDataType
Definition: dynamic_quant_epilogue.hpp:49
remove_cvref_t< typename Problem::ODataType > ODataType
Definition: dynamic_quant_epilogue.hpp:50
static constexpr bool kPadM
Definition: dynamic_quant_epilogue.hpp:52
static constexpr CK_TILE_HOST_DEVICE index_t GetSmemSize()
Definition: dynamic_quant_epilogue.hpp:102
remove_cvref_t< typename Problem::SmoothScaleDataType > SmoothScaleDataType
Definition: dynamic_quant_epilogue.hpp:48
static constexpr CK_TILE_DEVICE auto MakeSmoothInputScaleTileDistribution()
Definition: dynamic_quant_epilogue.hpp:75
CK_TILE_DEVICE auto operator()(ODramWindowTmp &o_dram_window_tmp, YScaleWindow &y_scale_window, const OAccTile &o_acc_tile, void *smem)
Definition: dynamic_quant_epilogue.hpp:204
remove_cvref_t< typename Problem::AccDataType > AccDataType
Definition: dynamic_quant_epilogue.hpp:47
static constexpr CK_TILE_HOST_DEVICE auto GetBlockReduce2dSync()
Definition: dynamic_quant_epilogue.hpp:63
static constexpr bool kPadN
Definition: dynamic_quant_epilogue.hpp:53
static constexpr CK_TILE_HOST_DEVICE auto GetBlockReduce2d()
Definition: dynamic_quant_epilogue.hpp:57
static constexpr bool UseRawStore
Definition: dynamic_quant_epilogue.hpp:54
CK_TILE_DEVICE auto operator()(ODramWindowTmp &o_dram_window_tmp, const SmoothScaleWindow &sm_scale_window_, YScaleWindow &y_scale_window, const OAccTile &o_acc_tile, void *smem)
Definition: dynamic_quant_epilogue.hpp:180
static constexpr CK_TILE_HOST_DEVICE auto GetBlockReduce2dCrossWarpSync()
Definition: dynamic_quant_epilogue.hpp:69
remove_cvref_t< Problem_ > Problem
Definition: dynamic_quant_epilogue.hpp:46
CK_TILE_DEVICE auto Impl(ODramWindowTmp &o_dram_window_tmp, YScaleWindow &y_scale_window, const OAccTile &o_acc_tile, void *smem)
Definition: dynamic_quant_epilogue.hpp:109
Definition: dynamic_quant_epilogue.hpp:33
remove_cvref_t< YScaleDataType_ > YScaleDataType
Definition: dynamic_quant_epilogue.hpp:36
remove_cvref_t< ODataType_ > ODataType
Definition: dynamic_quant_epilogue.hpp:37
remove_cvref_t< Traits_ > Traits
Definition: dynamic_quant_epilogue.hpp:39
remove_cvref_t< BlockShape_ > BlockShape
Definition: dynamic_quant_epilogue.hpp:38
remove_cvref_t< SmoothScaleDataType_ > SmoothScaleDataType
Definition: dynamic_quant_epilogue.hpp:35
remove_cvref_t< AccDataType_ > AccDataType
Definition: dynamic_quant_epilogue.hpp:34
Definition: dynamic_quant_epilogue.hpp:17
static constexpr bool kPadM
Definition: dynamic_quant_epilogue.hpp:18
static constexpr bool UseRawStore
Definition: dynamic_quant_epilogue.hpp:21
static constexpr bool kPadN
Definition: dynamic_quant_epilogue.hpp:19
static constexpr bool UseSmoothInputScale
Definition: dynamic_quant_epilogue.hpp:20
static constexpr bool UseMax3
Definition: dynamic_quant_epilogue.hpp:22
Definition: integral_constant.hpp:13
Definition: numeric.hpp:18
Definition: sequence.hpp:49
Definition: tile_distribution_encoding.hpp:26
Definition: tuple.hpp:192