Skip to content

Commit bee986c

Browse files
tedzhouhk authored and nnshah1 committed
fix: missing tokenizer args in sla_planner.py (#2667)
Signed-off-by: nnshah1 <neelays@nvidia.com>
1 parent 893ff49 commit bee986c

File tree

1 file changed: +6 −1 lines changed

benchmarks/profiler/profile_sla.py

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -158,7 +158,11 @@ async def run_profile(args):
158 158   base_url = client.get_service_url()
159 159   genai_perf_artifact_dir = f"{work_dir}/gap_isl{args.isl}"
160 160   gap_result = benchmark_prefill(
161     -     args.isl, genai_perf_artifact_dir, model_name, base_url=base_url
    161 +     args.isl,
    162 +     genai_perf_artifact_dir,
    163 +     model_name,
    164 +     model_name,
    165 +     base_url=base_url,
162 166   )
163 167   if gap_result is not None:
164 168       ttft = gap_result["time_to_first_token"]["avg"]
@@ -283,6 +287,7 @@ async def run_profile(args):
283 287       num_request,
284 288       genai_perf_artifact_dir,
285 289       model_name,
    290 +     model_name,
286 291       base_url=base_url,
287 292   )
288 293   if gap_result is not None:

0 commit comments

Comments
 (0)