include/ck/utility/amd_inline_asm.hpp File Reference
amd_inline_asm.hpp File Reference
Go to the source code of this file.
Namespaces
ck
Functions
__device__ int | ck::amd_assembly_and_or_b32 (int a, int b, int d) |
__device__ half2_t | ck::amd_assembly_pk_fma_f16 (half2_t a, half2_t b, half2_t c) |
__device__ half2_t | ck::amd_assembly_pk_add_f16 (half2_t a, half2_t b) |
__device__ void | ck::amd_assembly_outer_product_1x2 (float a, float b0, float b1, float &c0, float &c1) |
__device__ void | ck::amd_assembly_outer_product_1x4 (float a, float b0, float b1, float b2, float b3, float &c0, float &c1, float &c2, float &c3) |
__device__ void | ck::amd_assembly_outer_product_1x2 (half2_t a, half2_t b0, half2_t b1, float &c0, float &c1) |
__device__ void | ck::amd_assembly_outer_product_1x4 (half2_t a, half2_t b0, half2_t b1, half2_t b2, half2_t b3, float &c0, float &c1, float &c2, float &c3) |
__device__ void | ck::amd_assembly_outer_product_1x2 (int8x4_t a, int8x4_t b0, int8x4_t b1, int32_t &c0, int32_t &c1) |
__device__ void | ck::amd_assembly_outer_product_1x4 (int8x4_t a, int8x4_t b0, int8x4_t b1, int8x4_t b2, int8x4_t b3, int32_t &c0, int32_t &c1, int32_t &c2, int32_t &c3) |