@@ -87,7 +87,7 @@ def __init__(
8787 )
8888 self .use_fp8 = (isinstance (quant_config , Fp8Config ) or
8989 (isinstance (quant_config , QuarkConfig )
90- and quant_config ._is_fp8_w8a8 )
90+ and quant_config .is_fp8_w8a8 () )
9191 if current_platform .is_rocm () and not is_navi () else
9292 False )
9393 if hidden_act != "silu" :
@@ -201,7 +201,7 @@ def __init__(self,
201201 # For CUDA devices and Navi4x, attn_fp8 will be set to false.
202202 use_fp8 = isinstance (
203203 quant_config , Fp8Config ) or (isinstance (quant_config , QuarkConfig )
204- and quant_config ._is_fp8_w8a8 )
204+ and quant_config .is_fp8_w8a8 () )
205205 self .attn_fp8_out = envs .VLLM_USE_ROCM_CUSTOM_PAGED_ATTN_FP8_OUT \
206206 and current_platform .is_rocm () \
207207 and not is_navi () \
@@ -248,7 +248,7 @@ def __init__(
248248 self .hidden_size = config .hidden_size
249249 self .use_fp8 = (isinstance (quant_config , Fp8Config ) or
250250 (isinstance (quant_config , QuarkConfig )
251- and quant_config ._is_fp8_w8a8 )
251+ and quant_config .is_fp8_w8a8 () )
252252 if current_platform .is_rocm () and not is_navi () else
253253 False )
254254 rope_theta = getattr (config , "rope_theta" , 10000 )
0 commit comments