88import time
99import traceback
1010from dataclasses import dataclass , field
11- from typing import Optional , Union
1211
1312import aiohttp
1413import huggingface_hub .constants
@@ -28,13 +27,13 @@ class RequestFuncInput:
2827 prompt_len : int
2928 output_len : int
3029 model : str
31- model_name : Optional [ str ] = None
32- logprobs : Optional [ int ] = None
33- extra_body : Optional [ dict ] = None
34- multi_modal_content : Optional [ dict | list [dict ]] = None
30+ model_name : str | None = None
31+ logprobs : int | None = None
32+ extra_body : dict | None = None
33+ multi_modal_content : dict | list [dict ] | None = None
3534 ignore_eos : bool = False
36- language : Optional [ str ] = None
37- request_id : Optional [ str ] = None
35+ language : str | None = None
36+ request_id : str | None = None
3837
3938
4039@dataclass
@@ -52,7 +51,7 @@ class RequestFuncOutput:
5251
5352async def async_request_tgi (
5453 request_func_input : RequestFuncInput ,
55- pbar : Optional [ tqdm ] = None ,
54+ pbar : tqdm | None = None ,
5655) -> RequestFuncOutput :
5756 api_url = request_func_input .api_url
5857 assert api_url .endswith ("generate_stream" )
@@ -133,7 +132,7 @@ async def async_request_tgi(
133132
134133async def async_request_trt_llm (
135134 request_func_input : RequestFuncInput ,
136- pbar : Optional [ tqdm ] = None ,
135+ pbar : tqdm | None = None ,
137136) -> RequestFuncOutput :
138137 api_url = request_func_input .api_url
139138 assert api_url .endswith ("generate_stream" )
@@ -204,7 +203,7 @@ async def async_request_trt_llm(
204203
205204async def async_request_deepspeed_mii (
206205 request_func_input : RequestFuncInput ,
207- pbar : Optional [ tqdm ] = None ,
206+ pbar : tqdm | None = None ,
208207) -> RequestFuncOutput :
209208 api_url = request_func_input .api_url
210209 assert api_url .endswith (("completions" , "profile" )), (
@@ -267,7 +266,7 @@ async def async_request_deepspeed_mii(
267266
268267async def async_request_openai_completions (
269268 request_func_input : RequestFuncInput ,
270- pbar : Optional [ tqdm ] = None ,
269+ pbar : tqdm | None = None ,
271270) -> RequestFuncOutput :
272271 api_url = request_func_input .api_url
273272 assert api_url .endswith (("completions" , "profile" )), (
@@ -367,7 +366,7 @@ async def async_request_openai_completions(
367366
368367async def async_request_openai_chat_completions (
369368 request_func_input : RequestFuncInput ,
370- pbar : Optional [ tqdm ] = None ,
369+ pbar : tqdm | None = None ,
371370) -> RequestFuncOutput :
372371 api_url = request_func_input .api_url
373372 assert api_url .endswith (("chat/completions" , "profile" )), (
@@ -476,7 +475,7 @@ async def async_request_openai_chat_completions(
476475
477476async def async_request_openai_audio (
478477 request_func_input : RequestFuncInput ,
479- pbar : Optional [ tqdm ] = None ,
478+ pbar : tqdm | None = None ,
480479) -> RequestFuncOutput :
481480 # Lazy import without PlaceholderModule to avoid vllm dep.
482481 import soundfile
@@ -610,7 +609,7 @@ def get_tokenizer(
610609 tokenizer_mode : str = "auto" ,
611610 trust_remote_code : bool = False ,
612611 ** kwargs ,
613- ) -> Union [ PreTrainedTokenizer , PreTrainedTokenizerFast ] :
612+ ) -> PreTrainedTokenizer | PreTrainedTokenizerFast :
614613 if pretrained_model_name_or_path is not None and not os .path .exists (
615614 pretrained_model_name_or_path
616615 ):
0 commit comments