HIP: Heterogeneous-computing Interface for Portability
|
Struct representing four OCP fp8 numbers with e4m3 interpretation. More...
#include <amd_hip_fp8.h>
Public Member Functions | |
__FP8_HOST_DEVICE__ | __hip_fp8x4_e4m3 (const double4 val) |
__FP8_HOST_DEVICE__ | __hip_fp8x4_e4m3 (const float4 val) |
__FP8_HOST_DEVICE__ | __hip_fp8x4_e4m3 (const __hip_bfloat162 low, const __hip_bfloat162 high) |
__FP8_HOST_DEVICE__ | __hip_fp8x4_e4m3 (const __half2 low, const __half2 high) |
__FP8_HOST_DEVICE__ | __hip_fp8x4_e4m3 ()=default |
__FP8_HOST_DEVICE__ | operator float4 () const |
Public Attributes | |
__hip_fp8x4_storage_t | __x |
Static Public Attributes | |
static constexpr __hip_saturation_t | __default_saturation = __HIP_SATFINITE |
raw storage of four fp8 numbers (this description belongs to the `__x` attribute above) | |
static constexpr __hip_fp8_interpretation_t | __default_interpret = __HIP_E4M3 |
static constexpr unsigned int | __we = 4 |
static constexpr unsigned int | __wm = 3 |
Struct representing four OCP fp8 numbers with e4m3 interpretation.
|
inline |
create fp8x4 e4m3 type from double4
|
inline |
create fp8x4 e4m3 type from float4
|
inline |
create fp8x4 e4m3 type from two __hip_bfloat162
|
inline |
create fp8x4 e4m3 type from two __half2
|
default |
Default construct fp8x4 e4m3