mirror of
https://github.com/vllm-project/vllm.git
synced 2025-10-20 23:03:52 +08:00
[ROCm][Quantization][Kernel] Use FP8 FNUZ when OCP flag is 0 or undefined (#13851)
Signed-off-by: Hollow Man <hollowman@opensuse.org>
This commit is contained in:
@@ -24,12 +24,12 @@ __inline__ __device__ Tout scaled_vec_conversion(const Tin& x,
 return x;
 }
 
-#if HIP_FP8_TYPE_FNUZ
-using fp8_type = __hip_fp8_e4m3_fnuz;
-using fp8x2_type = __hip_fp8x2_e4m3_fnuz;
-#elif HIP_FP8_TYPE_OCP
+#if HIP_FP8_TYPE_OCP
 using fp8_type = __hip_fp8_e4m3;
 using fp8x2_type = __hip_fp8x2_e4m3;
+#else
+using fp8_type = __hip_fp8_e4m3_fnuz;
+using fp8x2_type = __hip_fp8x2_e4m3_fnuz;
 #endif
 
 // fp8 -> half
Reference in New Issue
Block a user