#include <variants.hpp>
|
__device__ __host__ | StandardAttention ()=default |
|
template<typename Params , typename T > |
__device__ __forceinline__ T | QueryTransform (const Params &params, T q) const |
|
template<typename Params , typename T > |
__device__ __forceinline__ T | LogitsTransform ([[maybe_unused]] const Params &params, T logits, [[maybe_unused]] uint32_t batch_idx, [[maybe_unused]] uint32_t qo_head_idx, [[maybe_unused]] uint32_t kv_head_idx) const |
|
template<typename Params > |
__device__ __forceinline__ bool | LogitsMask (const Params &params, [[maybe_unused]] uint32_t batch_idx, uint32_t qo_idx, uint32_t kv_idx, [[maybe_unused]] uint32_t qo_head_idx, [[maybe_unused]] uint32_t kv_head_idx) const |
|
◆ StandardAttention()
__device__ __host__ ck_tile::StandardAttention::StandardAttention |
( |
| ) |
|
|
default |
◆ LogitsMask()
template<typename Params >
__device__ __forceinline__ bool ck_tile::StandardAttention::LogitsMask |
( |
const Params & |
params, |
|
|
[[maybe_unused]] uint32_t |
batch_idx, |
|
|
uint32_t |
qo_idx, |
|
|
uint32_t |
kv_idx, |
|
|
[[maybe_unused]] uint32_t |
qo_head_idx, |
|
|
[[maybe_unused]] uint32_t |
kv_head_idx |
|
) |
| const |
|
inline |
◆ LogitsTransform()
template<typename Params , typename T >
__device__ __forceinline__ T ck_tile::StandardAttention::LogitsTransform |
( |
[[maybe_unused]] const Params & |
params, |
|
|
T |
logits, |
|
|
[[maybe_unused]] uint32_t |
batch_idx, |
|
|
[[maybe_unused]] uint32_t |
qo_head_idx, |
|
|
[[maybe_unused]] uint32_t |
kv_head_idx |
|
) |
| const |
|
inline |
NOTICE: For better performance, we simply transform the thread buffer without calculating qo_idx/kv_idx.
◆ QueryTransform()
template<typename Params , typename T >
__device__ __forceinline__ T ck_tile::StandardAttention::QueryTransform |
( |
const Params & |
params, |
|
|
T |
q |
|
) |
| const |
|
inline |
The documentation for this struct was generated from the following file:
- /home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/develop/include/ck_tile/ops/fmha/block/variants.hpp