From 065b30618cb885523ef8cd554fb99303d0f154a1 Mon Sep 17 00:00:00 2001
From: Ren MinMin
Date: Fri, 10 Jan 2025 07:41:08 +0000
Subject: [PATCH] [Misc] Update benchmark_prefix_caching.py fixed example usage

Signed-off-by: Ren MinMin
---
 benchmarks/benchmark_prefix_caching.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/benchmarks/benchmark_prefix_caching.py b/benchmarks/benchmark_prefix_caching.py
index 5e9381f712e10..3ab421a89c935 100644
--- a/benchmarks/benchmark_prefix_caching.py
+++ b/benchmarks/benchmark_prefix_caching.py
@@ -10,7 +10,8 @@
         --model meta-llama/Llama-2-7b-chat-hf \
         --enable-prefix-caching \
         --num-prompts 1 \
-        --repeat-count 100
+        --repeat-count 100 \
+        --input-length-range 128:256
 
 ShareGPT example usage:
     # This command samples 20 prompts with input lengths