element_wise Namespace Reference

element_wise Namespace Reference

Composable Kernel: ck_tile::element_wise Namespace Reference
ck_tile::element_wise Namespace Reference

Classes

struct  Add
 
struct  PassThroughPack8
 
struct  DequantPack8
 
struct  PassThroughPack2
 
struct  PassThrough
 
struct  MultiDMultiply
 
struct  MultiDAdd
 
struct  Scale
 
struct  ScaleAndResetNaNToMinusInfinity
 
struct  UnaryDivide
 
struct  UnarySquare
 
struct  UnaryAbs
 
struct  UnarySqrt
 
struct  Relu
 
struct  FastGelu
 
struct  FastGeluAsm
 
struct  Gelu
 
struct  Sigmoid
 
struct  Silu
 
struct  TanH
 
struct  ACos
 
struct  Neg
 
struct  ATan
 
struct  Sin
 
struct  ASinH
 
struct  Cos
 
struct  ACosH
 
struct  Tan
 
struct  ATanH
 
struct  SinH
 
struct  Ceil
 
struct  Exp
 
struct  CosH
 
struct  Floor
 
struct  Log
 
struct  ASin
 
struct  Rcp
 
struct  Swish
 
struct  SoftRelu
 
struct  Power
 
struct  ClippedRelu
 
struct  LeakyRelu
 
struct  Elu
 
struct  Logistic
 
struct  ConvInvscale
 
struct  ConvScale
 
struct  ConvScaleRelu
 
struct  Cast
 

Functions

CK_TILE_DEVICE fp16x4_t i4_to_half4 (int q)
 
CK_TILE_DEVICE fp16x4_t i4_to_half4_scale (int q, const fp16x2_t &scale)
 
CK_TILE_DEVICE bf16x4_t i4_to_bhalf4 (int q)
 
CK_TILE_DEVICE fp8x8_t amd_assembly_i4_to_fp8x8 (int a)
 
CK_TILE_DEVICE float amd_assembly_fp8_to_fp32 (uint32_t src)
 
CK_TILE_DEVICE float amd_assembly_bf8_to_fp32 (uint32_t src)
 
CK_TILE_DEVICE bf8x8_t amd_assembly_i4_to_bf8x8 (int a)
 

Function Documentation

◆ amd_assembly_bf8_to_fp32()

CK_TILE_DEVICE float ck_tile::element_wise::amd_assembly_bf8_to_fp32 ( uint32_t  src)

◆ amd_assembly_fp8_to_fp32()

CK_TILE_DEVICE float ck_tile::element_wise::amd_assembly_fp8_to_fp32 ( uint32_t  src)

◆ amd_assembly_i4_to_bf8x8()

CK_TILE_DEVICE bf8x8_t ck_tile::element_wise::amd_assembly_i4_to_bf8x8 ( int  a)

◆ amd_assembly_i4_to_fp8x8()

CK_TILE_DEVICE fp8x8_t ck_tile::element_wise::amd_assembly_i4_to_fp8x8 ( int  a)

◆ i4_to_bhalf4()

CK_TILE_DEVICE bf16x4_t ck_tile::element_wise::i4_to_bhalf4 ( int  q)

◆ i4_to_half4()

CK_TILE_DEVICE fp16x4_t ck_tile::element_wise::i4_to_half4 ( int  q)

◆ i4_to_half4_scale()

CK_TILE_DEVICE fp16x4_t ck_tile::element_wise::i4_to_half4_scale ( int  q,
const fp16x2_t & scale
)