/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/develop/include/ck/utility/inner_product.hpp Source File
inner_product.hpp
Go to the documentation of this file.
76 __device__ void inner_product<bhalf_t, bhalf_t, float>(const bhalf_t& a, const bhalf_t& b, float& c)
88 __device__ void inner_product<half2_t, half2_t, float>(const half2_t& a, const half2_t& b, float& c)
93 // https://www.amd.com/system/files/TechDocs/instinct-mi200-cdna2-instruction-set-architecture.pdf
116 __device__ void inner_product<half4_t, half4_t, float>(const half4_t& a, const half4_t& b, float& c)
131 __device__ void inner_product<half8_t, half8_t, float>(const half8_t& a, const half8_t& b, float& c)
156 __device__ void inner_product<int8_t, int8_t, int32_t>(const int8_t& a, const int8_t& b, int32_t& c)
184 // https://www.amd.com/system/files/TechDocs/instinct-mi200-cdna2-instruction-set-architecture.pdf
226 inner_product<int8x16_t, int8x16_t, int32_t>(const int8x16_t& a, const int8x16_t& b, int32_t& c)
Definition: ck.hpp:267
__device__ void inner_product< half_t, half_t, float >(const half_t &a, const half_t &b, float &c)
Definition: inner_product.hpp:82
__device__ void inner_product< float2_t, float2_t, float >(const float2_t &a, const float2_t &b, float &c)
Definition: inner_product.hpp:35
__device__ void inner_product< int8x2_t, int8x2_t, int32_t >(const int8x2_t &a, const int8x2_t &b, int32_t &c)
Definition: inner_product.hpp:163
__device__ void inner_product< half2_t, half2_t, float >(const half2_t &a, const half2_t &b, float &c)
Definition: inner_product.hpp:88
__device__ void inner_product< float4_t, float4_t, float >(const float4_t &a, const float4_t &b, float &c)
Definition: inner_product.hpp:51
__device__ void inner_product< int8x8_t, int8x8_t, int32_t >(const int8x8_t &a, const int8x8_t &b, int32_t &c)
Definition: inner_product.hpp:210
__device__ void inner_product< half4_t, half4_t, float >(const half4_t &a, const half4_t &b, float &c)
Definition: inner_product.hpp:116
__device__ void inner_product< bhalf_t, bhalf_t, float >(const bhalf_t &a, const bhalf_t &b, float &c)
Definition: inner_product.hpp:76
__device__ void inner_product< int8x16_t, int8x16_t, int32_t >(const int8x16_t &a, const int8x16_t &b, int32_t &c)
Definition: inner_product.hpp:226
__device__ void inner_product< half8_t, half8_t, float >(const half8_t &a, const half8_t &b, float &c)
Definition: inner_product.hpp:131
__device__ void inner_product< int8_t, int8_t, int32_t >(const int8_t &a, const int8_t &b, int32_t &c)
Definition: inner_product.hpp:156
__device__ void inner_product< int8x4_t, int8x4_t, int32_t >(const int8x4_t &a, const int8x4_t &b, int32_t &c)
Definition: inner_product.hpp:179
__device__ void inner_product(const TA &a, const TB &b, TC &c)
__device__ void inner_product< float, float, float >(const float &a, const float &b, float &c)
Definition: inner_product.hpp:14
Definition: integral_constant.hpp:20
Definition: functional2.hpp:33
Definition: dtype_vector.hpp:10