@@ -531,18 +531,22 @@ async def benchmark(
531531 extra_body = extra_body ,
532532 )
533533
534- test_output = await wait_for_endpoint (
535- request_func ,
536- test_input ,
537- session ,
538- timeout_seconds = ready_check_timeout_sec ,
539- )
540- if not test_output .success :
541- raise ValueError (
542- "Initial test run failed - Please make sure benchmark arguments "
543- f"are correctly specified. Error: { test_output .error } " )
534+ if ready_check_timeout_sec > 0 :
535+ test_output = await wait_for_endpoint (
536+ request_func ,
537+ test_input ,
538+ session ,
539+ timeout_seconds = ready_check_timeout_sec ,
540+ )
541+ if not test_output .success :
542+ raise ValueError (
543+ "Initial test run failed - Please make sure benchmark "
544+ "arguments are correctly specified. "
545+ f"Error: { test_output .error } " )
546+ else :
547+ print ("Initial test run completed. Starting main benchmark run..." )
544548 else :
545- print ("Initial test run completed. Starting main benchmark run.. ." )
549+ print ("Skipping endpoint ready check ." )
546550
547551 if lora_modules :
548552 # For each input request, choose a LoRA module at random.
@@ -1151,7 +1155,8 @@ def add_cli_args(parser: argparse.ArgumentParser):
11511155 type = int ,
11521156 default = 600 ,
11531157 help = "Maximum time to wait for the endpoint to become ready "
1154- "in seconds (default: 600 seconds / 10 minutes)." ,
1158+ "in seconds (default: 600 seconds / 10 minutes). If set to 0, "
1159+ "the ready check will be skipped."
11551160 )
11561161
11571162
0 commit comments