@@ -310,7 +310,7 @@ def evaluation_test( # noqa: C901
310310 steps: Number of rollout steps to execute (default: 30).
311311 mode: Evaluation mode. "pointwise" (default) applies test function to each row (rollout result).
312312 "groupwise" applies test function to a group of rollout results from the same original row (for use cases such as dpo/grpo).
313- "listwise " applies test function to the whole dataset.
313+ "all " applies test function to the whole dataset.
314314 logger: DatasetLogger to use for logging. If not provided, a default logger will be used.
315315 """
316316
@@ -349,29 +349,29 @@ def decorator(
349349 # additional check for groupwise evaluation
350350 elif mode == "groupwise" :
351351 if "rows" not in sig .parameters :
352- raise ValueError ("In listwise mode, your eval function must have a parameter named 'rows'" )
352+ raise ValueError ("In groupwise mode, your eval function must have a parameter named 'rows'" )
353353
354354 # validate that "Rows" is of type List[EvaluationRow]
355355 if sig .parameters ["rows" ].annotation is not List [EvaluationRow ]:
356- raise ValueError ("In listwise mode, the 'rows' parameter must be of type List[EvaluationRow" )
356+ raise ValueError ("In groupwise mode, the 'rows' parameter must be of type List[EvaluationRow" )
357357
358358 # validate that the function has a return type of List[EvaluationRow]
359359 if sig .return_annotation is not List [EvaluationRow ]:
360- raise ValueError ("In listwise mode, your eval function must return a list of EvaluationRow instances" )
360+ raise ValueError ("In groupwise mode, your eval function must return a list of EvaluationRow instances" )
361361 if len (completion_params ) < 2 :
362362 raise ValueError ("In groupwise mode, you must provide at least 2 completion parameters" )
363363 else :
364- # listwise mode: function should accept input_dataset and model
364+ # all mode: function should accept input_dataset and model
365365 if "rows" not in sig .parameters :
366- raise ValueError ("In batch mode, your eval function must have a parameter named 'rows'" )
366+ raise ValueError ("In all mode, your eval function must have a parameter named 'rows'" )
367367
368368 # validate that "Rows" is of type List[EvaluationRow]
369369 if sig .parameters ["rows" ].annotation is not List [EvaluationRow ]:
370- raise ValueError ("In batch mode, the 'rows' parameter must be of type List[EvaluationRow" )
370+ raise ValueError ("In all mode, the 'rows' parameter must be of type List[EvaluationRow" )
371371
372372 # validate that the function has a return type of List[EvaluationRow]
373373 if sig .return_annotation is not List [EvaluationRow ]:
374- raise ValueError ("In listwise mode, your eval function must return a list of EvaluationRow instances" )
374+ raise ValueError ("In all mode, your eval function must return a list of EvaluationRow instances" )
375375
376376 async def execute_with_params (
377377 test_func : TestFunction ,
@@ -434,7 +434,7 @@ async def execute_with_params(
434434 param_tuple .append (etk )
435435 param_tuples .append (tuple (param_tuple ))
436436
437- # For listwise mode, preserve the original parameter names
437+ # For all mode, preserve the original parameter names
438438 test_param_names = []
439439 if input_dataset is not None :
440440 test_param_names .append ("dataset_path" )
0 commit comments