/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/develop/include/ck/tensor_operation/gpu/thread/threadwise_welford.hpp Source File
threadwise_welford.hpp
Go to the documentation of this file.
Definition: ck.hpp:267
ThreadwiseWelford
Definition: threadwise_welford.hpp:18
__device__ void Update(T &mean, T &var, T x)
Definition: threadwise_welford.hpp:31
static constexpr auto thread_mean_var_length_m
Definition: threadwise_welford.hpp:24
constexpr __device__ ThreadwiseWelford()
Definition: threadwise_welford.hpp:29
static constexpr auto mean_var_thread_desc_m
Definition: threadwise_welford.hpp:20
static constexpr auto x_thread_desc_m_k
Definition: threadwise_welford.hpp:19
__device__ void Run(const XBufferType &x_buf_m_k, MeanBufferType &mean_buf_m, VarBufferType &var_buf_m)
Definition: threadwise_welford.hpp:51
static constexpr auto thread_x_length_m
Definition: threadwise_welford.hpp:22
static constexpr auto thread_x_length_k
Definition: threadwise_welford.hpp:23
Definition: threadwise_welford.hpp:83
static __device__ void Run(const SrcMeanBufferType &src_mean_buf, const SrcVarBufferType &src_var_buf, const SrcCountBufferType &src_count_buf, DstMeanBufferType &dst_mean_buf, DstVarBufferType &dst_var_buf, DstCountBufferType &dst_count_buf)
Definition: threadwise_welford.hpp:110
static constexpr auto src_length_k
Definition: threadwise_welford.hpp:88
static __device__ void Merge(T &mean_a, T &var_a, int32_t &count_a, T mean_b, T var_b, int32_t count_b)
Definition: threadwise_welford.hpp:94
static constexpr auto dst_thread_desc_m
Definition: threadwise_welford.hpp:85
static constexpr auto dst_length_m
Definition: threadwise_welford.hpp:89
static constexpr auto src_thread_desc_m_k
Definition: threadwise_welford.hpp:84
static constexpr auto src_length_m
Definition: threadwise_welford.hpp:87
Definition: integral_constant.hpp:20
Definition: functional2.hpp:33