include/ck/utility/amd_inline_asm.hpp File Reference

include/ck/utility/amd_inline_asm.hpp File Reference

Composable Kernel: include/ck/utility/amd_inline_asm.hpp File Reference
amd_inline_asm.hpp File Reference

Go to the source code of this file.

Namespaces

 ck
 

Functions

__device__ int ck::amd_assembly_and_or_b32 (int a, int b, int d)
 
__device__ half2_t ck::amd_assembly_pk_fma_f16 (half2_t a, half2_t b, half2_t c)
 
__device__ half2_t ck::amd_assembly_pk_add_f16 (half2_t a, half2_t b)
 
__device__ void ck::amd_assembly_outer_product_1x2 (float a, float b0, float b1, float &c0, float &c1)
 
__device__ void ck::amd_assembly_outer_product_1x4 (float a, float b0, float b1, float b2, float b3, float &c0, float &c1, float &c2, float &c3)
 
__device__ void ck::amd_assembly_outer_product_1x2 (half2_t a, half2_t b0, half2_t b1, float &c0, float &c1)
 
__device__ void ck::amd_assembly_outer_product_1x4 (half2_t a, half2_t b0, half2_t b1, half2_t b2, half2_t b3, float &c0, float &c1, float &c2, float &c3)
 
__device__ void ck::amd_assembly_outer_product_1x2 (int8x4_t a, int8x4_t b0, int8x4_t b1, int32_t &c0, int32_t &c1)
 
__device__ void ck::amd_assembly_outer_product_1x4 (int8x4_t a, int8x4_t b0, int8x4_t b1, int8x4_t b2, int8x4_t b3, int32_t &c0, int32_t &c1, int32_t &c2, int32_t &c3)