diff --git a/src/inference_endpoint/commands/benchmark/execute.py b/src/inference_endpoint/commands/benchmark/execute.py index 88e337f89..090f43e50 100644 --- a/src/inference_endpoint/commands/benchmark/execute.py +++ b/src/inference_endpoint/commands/benchmark/execute.py @@ -335,7 +335,16 @@ def _precompute_isl_for_multi_turn( return skipped = 0 first_failure_logged = False - for sample in dataloader.data or []: + samples = dataloader.data or [] + for sample in tqdm( + samples, + total=len(samples), + desc="Pre-computing ISL token counts", + unit="turn", + smoothing=0, + mininterval=2.0, + disable=not logger.isEnabledFor(logging.INFO), + ): messages = sample.get("messages") if not messages: continue