File tree Expand file tree Collapse file tree
mistralrs-cli/src/commands Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -102,6 +102,10 @@ pub async fn run_bench(
102102 }
103103 info ! ( "Warmup complete." ) ;
104104
105+ // Clear any residual KV cache from warmup
106+ let sender = mistralrs. get_sender ( None ) . unwrap ( ) ;
107+ let _ = sender. send ( mistralrs_core:: Request :: TerminateAllSeqsNextStep ) . await ;
108+
105109 // Reset logger counters so benchmark stats are clean
106110 if let Ok ( logger) = mistralrs. get_logger ( None ) {
107111 logger. reset ( ) ;
@@ -142,6 +146,10 @@ pub async fn run_bench(
142146 let ms_per_tok = 1000.0 / tok_per_sec;
143147 decode_results. push ( ( tok_per_sec, ms_per_tok) ) ;
144148 }
149+
150+ // Ask the engine to terminate all sequences on its next step so no cached state lingers.
151+ let sender = mistralrs. get_sender ( None ) . unwrap ( ) ;
152+ let _ = sender. send ( mistralrs_core:: Request :: TerminateAllSeqsNextStep ) . await ;
145153 }
146154
147155 // Calculate statistics
You can’t perform that action at this time.
0 commit comments