element_wise Namespace Reference
Classes
struct | Add |
struct | PassThroughPack8 |
struct | DequantPack8 |
struct | PassThroughPack2 |
struct | PassThrough |
struct | MultiDMultiply |
struct | MultiDAdd |
struct | Scale |
struct | ScaleAndResetNaNToMinusInfinity |
struct | UnaryDivide |
struct | UnarySquare |
struct | UnaryAbs |
struct | UnarySqrt |
struct | Relu |
struct | FastGelu |
struct | FastGeluAsm |
struct | Gelu |
struct | Sigmoid |
struct | Silu |
struct | TanH |
struct | ACos |
struct | Neg |
struct | ATan |
struct | Sin |
struct | ASinH |
struct | Cos |
struct | ACosH |
struct | Tan |
struct | ATanH |
struct | SinH |
struct | Ceil |
struct | Exp |
struct | CosH |
struct | Floor |
struct | Log |
struct | ASin |
struct | Rcp |
struct | Swish |
struct | SoftRelu |
struct | Power |
struct | ClippedRelu |
struct | LeakyRelu |
struct | Elu |
struct | Logistic |
struct | ConvInvscale |
struct | ConvScale |
struct | ConvScaleRelu |
struct | Cast |
Functions
CK_TILE_DEVICE fp16x4_t | i4_to_half4 (int q) |
CK_TILE_DEVICE fp16x4_t | i4_to_half4_scale (int q, const fp16x2_t &scale) |
CK_TILE_DEVICE bf16x4_t | i4_to_bhalf4 (int q) |
CK_TILE_DEVICE fp8x8_t | amd_assembly_i4_to_fp8x8 (int a) |
CK_TILE_DEVICE float | amd_assembly_fp8_to_fp32 (uint32_t src) |
CK_TILE_DEVICE float | amd_assembly_bf8_to_fp32 (uint32_t src) |
CK_TILE_DEVICE bf8x8_t | amd_assembly_i4_to_bf8x8 (int a) |
Function Documentation
◆ amd_assembly_bf8_to_fp32()
CK_TILE_DEVICE float ck_tile::element_wise::amd_assembly_bf8_to_fp32(uint32_t src)
◆ amd_assembly_fp8_to_fp32()
CK_TILE_DEVICE float ck_tile::element_wise::amd_assembly_fp8_to_fp32(uint32_t src)
◆ amd_assembly_i4_to_bf8x8()
CK_TILE_DEVICE bf8x8_t ck_tile::element_wise::amd_assembly_i4_to_bf8x8(int a)
◆ amd_assembly_i4_to_fp8x8()
CK_TILE_DEVICE fp8x8_t ck_tile::element_wise::amd_assembly_i4_to_fp8x8(int a)
◆ i4_to_bhalf4()
CK_TILE_DEVICE bf16x4_t ck_tile::element_wise::i4_to_bhalf4(int q)
◆ i4_to_half4()
CK_TILE_DEVICE fp16x4_t ck_tile::element_wise::i4_to_half4(int q)
◆ i4_to_half4_scale()
CK_TILE_DEVICE fp16x4_t ck_tile::element_wise::i4_to_half4_scale(int q, const fp16x2_t &scale)