Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account-related emails.

Already on GitHub? Sign in to your account

[INFER][LLM] Add the AutoPredictor for inference #9445

Merged
merged 9 commits into from
Dec 3, 2024
Merged
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Prev Previous commit
Next Next commit
polish
zeroRains committed Nov 27, 2024
commit 1e89250ebe8d08cf4efcab6ea5ba8f78a9ad7604
15 changes: 5 additions & 10 deletions llm/predict/predictor.py
Original file line number Diff line number Diff line change
@@ -58,12 +58,10 @@
)


def get_attention_type(*args):
"""
It must be passed in the following order.
(block_attn)
"""
def get_attention_type(predictor_args):
count = 0
# It must follow this order
args = predictor_args.block_attn
res = []
for attn_type in args:
if attn_type:
@@ -73,10 +71,7 @@ def get_attention_type(*args):
res.append(False)
if count > 1:
raise ValueError("Only one attention type can be used")
try:
return ATTENTION_TYPE_FOR_PREDICTOR_MAPPING_NAMES[tuple(res)]
except KeyError:
raise ValueError("Unknown attention type")
return ATTENTION_TYPE_FOR_PREDICTOR_MAPPING_NAMES[tuple(res)]


@dataclass
@@ -1315,7 +1310,7 @@ def create_predictor(
# infer/ no infer
if predictor_args.inference_model:
# block/no block
attn_type = get_attention_type(predictor_args.block_attn)
attn_type = get_attention_type(predictor_args)
inference_mode = f"{attn_type}Inference"

if predictor_args.mode == "static":
15 changes: 5 additions & 10 deletions paddlenlp/transformers/auto/modeling.py
Original file line number Diff line number Diff line change
@@ -170,12 +170,10 @@
)


def get_attention_type(*args):
"""
It must be passed in the following order.
(block_attn, speculate_attn)
"""
def get_attention_type(predictor_args):
count = 0
# It must follow this order
args = (predictor_args.block_attn, predictor_args.speculate_attn)
res = []
for attn_type in args:
if attn_type:
@@ -185,10 +183,7 @@ def get_attention_type(*args):
res.append(False)
if count > 1:
raise ValueError("Only one attention type can be True")
try:
return ATTENTION_TYPE_FOR_MODEL_MAPPING_NAMES[tuple(res)]
except KeyError:
raise ValueError("Unknown attention type")
return ATTENTION_TYPE_FOR_MODEL_MAPPING_NAMES[tuple(res)]


def get_name_mapping(task="Model"):
@@ -860,7 +855,7 @@ def from_pretrained(cls, pretrained_model_name_or_path, *model_args, **kwargs):
)
else:
# Check whether the model use block attention
attn_type = get_attention_type(predictor_args.block_attn, predictor_args.speculate_attn)
attn_type = get_attention_type(predictor_args)
model_name = f"{config.architectures[0]}{attn_type}"

# Import the InferenceModel