From 46f33645aa2c1bff7cf4b0e73876cd75e2ab79d0 Mon Sep 17 00:00:00 2001
From: minmin
Date: Sat, 11 Jan 2025 04:39:22 +0800
Subject: [PATCH] [Misc] Update benchmark_prefix_caching.py fixed example usage (#11920)

Signed-off-by: Ren MinMin
Co-authored-by: Ren MinMin
---
 benchmarks/benchmark_prefix_caching.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/benchmarks/benchmark_prefix_caching.py b/benchmarks/benchmark_prefix_caching.py
index 5e9381f712e10..3ab421a89c935 100644
--- a/benchmarks/benchmark_prefix_caching.py
+++ b/benchmarks/benchmark_prefix_caching.py
@@ -10,7 +10,8 @@
         --model meta-llama/Llama-2-7b-chat-hf \
         --enable-prefix-caching \
         --num-prompts 1 \
-        --repeat-count 100
+        --repeat-count 100 \
+        --input-length-range 128:256
 
 ShareGPT example usage:
     # This command samples 20 prompts with input lengths