/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/develop/include/ck/utility/mxf8_utils.hpp File Reference

/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/develop/include/ck/utility/mxf8_utils.hpp File Reference

Composable Kernel: /home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/develop/include/ck/utility/mxf8_utils.hpp File Reference
mxf8_utils.hpp File Reference

Go to the source code of this file.

Namespaces

 ck
 
 ck::fp8_impl
 

Macros

#define CK_MX_FP8_CVT_FAST_PATH   0
 

Functions

template<typename Y , typename X >
__host__ constexpr __device__ Y ck::mxf8_convert_sr (X x, float scale)
 
template<typename Y , typename X >
__host__ constexpr __device__ Y ck::mxf8_convert_rne (X x, float scale)
 
template<>
__host__ __device__ f8_ocp_t ck::mxf8_convert_rne< f8_ocp_t, float > (float x, float scale)
 
template<>
__host__ __device__ bf8_ocp_t ck::mxf8_convert_rne< bf8_ocp_t, float > (float x, float scale)
 
template<>
__host__ __device__ f8x2_ocp_t ck::mxf8_convert_rne< f8x2_ocp_t, float2_t > (float2_t x, float scale)
 
template<>
__host__ __device__ bf8x2_ocp_t ck::mxf8_convert_rne< bf8x2_ocp_t, float2_t > (float2_t x, float scale)
 
template<>
__host__ __device__ f8x16_ocp_t ck::mxf8_convert_rne< f8x16_ocp_t, float16_t > (float16_t x, float scale)
 
template<>
__host__ __device__ bf8x16_ocp_t ck::mxf8_convert_rne< bf8x16_ocp_t, float16_t > (float16_t x, float scale)
 
template<>
__host__ __device__ f8x32_ocp_t ck::mxf8_convert_rne< f8x32_ocp_t, float32_t > (float32_t x, float scale)
 
template<>
__host__ __device__ bf8x32_ocp_t ck::mxf8_convert_rne< bf8x32_ocp_t, float32_t > (float32_t x, float scale)
 
template<>
__host__ __device__ f8_ocp_t ck::mxf8_convert_sr< f8_ocp_t, float > (float x, float scale)
 
template<>
__host__ __device__ bf8_ocp_t ck::mxf8_convert_sr< bf8_ocp_t, float > (float x, float scale)
 
template<>
__host__ __device__ f8x2_ocp_t ck::mxf8_convert_sr< f8x2_ocp_t, float2_t > (float2_t x, float scale)
 
template<>
__host__ __device__ bf8x2_ocp_t ck::mxf8_convert_sr< bf8x2_ocp_t, float2_t > (float2_t x, float scale)
 
template<>
__host__ __device__ f8x16_ocp_t ck::mxf8_convert_sr< f8x16_ocp_t, float16_t > (float16_t x, float scale)
 
template<>
__host__ __device__ bf8x16_ocp_t ck::mxf8_convert_sr< bf8x16_ocp_t, float16_t > (float16_t x, float scale)
 
template<>
__host__ __device__ f8x32_ocp_t ck::mxf8_convert_sr< f8x32_ocp_t, float32_t > (float32_t x, float scale)
 
template<>
__host__ __device__ bf8x32_ocp_t ck::mxf8_convert_sr< bf8x32_ocp_t, float32_t > (float32_t x, float scale)
 

Macro Definition Documentation

CK_MX_FP8_CVT_FAST_PATH

#define CK_MX_FP8_CVT_FAST_PATH   0