We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4f4c115, commit c635a4b. Copy full SHA for c635a4b.
benchmarks/profiler/utils/profile_decode.py
@@ -41,12 +41,10 @@ def profile_decode(
41
(max_context_length - osl) // interpolation_granularity,
42
):
43
max_concurrency = max_kv_tokens // (isl + osl)
44
- sweep_num_request = list(
45
- range(
46
- 1,
47
- max_concurrency,
48
- max_concurrency // interpolation_granularity,
49
- )
+ sweep_num_request = range(
+ 1,
+ max_concurrency,
+ max_concurrency // interpolation_granularity,
50
)
51
for num_request in sweep_num_request:
52
genai_perf_artifact_dir = f"{work_dir}/gap_isl{isl}_osl{osl}_n{num_request}"
0 commit comments