Skip to content

Commit cf08dbe

Browse files
tedzhouhk authored and hhzhang16 committed
fix: missing tokenizer args in sla_planner.py (#2667)
Signed-off-by: Hannah Zhang <hannahz@nvidia.com>
1 parent 30d141c commit cf08dbe

File tree

1 file changed

+6
-1
lines changed

1 file changed

+6
-1
lines changed

benchmarks/profiler/profile_sla.py

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -154,7 +154,11 @@ async def run_profile(args):
154 154   base_url = client.get_service_url()
155 155   genai_perf_artifact_dir = f"{work_dir}/gap_isl{args.isl}"
156 156   gap_result = benchmark_prefill(
157     - args.isl, genai_perf_artifact_dir, model_name, base_url=base_url
    157 + args.isl,
    158 + genai_perf_artifact_dir,
    159 + model_name,
    160 + model_name,
    161 + base_url=base_url,
158 162   )
159 163   if gap_result is not None:
160 164   ttft = gap_result["time_to_first_token"]["avg"]
@@ -279,6 +283,7 @@ async def run_profile(args):
279 283   num_request,
280 284   genai_perf_artifact_dir,
281 285   model_name,
    286 + model_name,
282 287   base_url=base_url,
283 288   )
284 289   if gap_result is not None:

0 commit comments

Comments
 (0)