/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/develop/include/ck/utility/amd_inline_asm.hpp File Reference

/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/develop/include/ck/utility/amd_inline_asm.hpp File Reference

Composable Kernel: /home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/develop/include/ck/utility/amd_inline_asm.hpp File Reference
amd_inline_asm.hpp File Reference

Go to the source code of this file.

Namespaces

 ck
 

Functions

__device__ int ck::amd_assembly_and_b32 (int a, int b)
 
__device__ int ck::amd_assembly_and_or_b32 (int a, int b, int d)
 
__device__ half2_t ck::amd_assembly_pk_fma_f16 (half2_t a, half2_t b, half2_t c)
 
__device__ half2_t ck::amd_assembly_pk_add_f16 (half2_t a, half2_t b)
 
__device__ float ck::amd_assemble_cvt_f32_i4 (int b)
 
__device__ f8x4_t ck::amd_assembly_cvt_f8_to_f32 (float b0, float b1, float b2, float b3)
 
__device__ f8x8_t ck::amd_assembly_i4_to_fp8x8 (int a)
 
__device__ void ck::amd_assembly_outer_product_1x2 (float a, float b0, float b1, float &c0, float &c1)
 
__device__ void ck::amd_assembly_outer_product_1x4 (float a, float b0, float b1, float b2, float b3, float &c0, float &c1, float &c2, float &c3)
 
__device__ void ck::amd_assembly_outer_product_1x2 (half2_t a, half2_t b0, half2_t b1, float &c0, float &c1)
 
__device__ void ck::amd_assembly_outer_product_1x4 (half2_t a, half2_t b0, half2_t b1, half2_t b2, half2_t b3, float &c0, float &c1, float &c2, float &c3)
 
__device__ void ck::amd_assembly_outer_product_1x2 (int8x4_t a, int8x4_t b0, int8x4_t b1, int32_t &c0, int32_t &c1)
 
__device__ void ck::amd_assembly_outer_product_1x4 (int8x4_t a, int8x4_t b0, int8x4_t b1, int8x4_t b2, int8x4_t b3, int32_t &c0, int32_t &c1, int32_t &c2, int32_t &c3)