Skip to content

Commit f785514

Browse files
committed
add postprocess
1 parent fae3150 commit f785514

2 files changed

Lines changed: 11 additions & 1 deletion

File tree

eval_protocol/pytest/evaluation_test.py

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -438,6 +438,17 @@ def _log_eval_error(status: Status, rows: list[EvaluationRow] | None, passed: bo
438438
all_results[run_idx].append(res)
439439

440440
processed_rows_in_run.append(res)
441+
postprocess(
442+
all_results,
443+
aggregation_method,
444+
passed_threshold,
445+
active_logger,
446+
mode,
447+
completion_params, # pyright: ignore[reportArgumentType]
448+
test_func.__name__,
449+
num_runs,
450+
time.perf_counter() - experiment_start_time,
451+
)
441452

442453
else:
443454
async def execute_run(run_idx: int, config: RolloutProcessorConfig):

tests/pytest/test_rollout_scheduler.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,6 @@
22
from eval_protocol.models import EvaluationRow, Message, EvaluateResult, InputMetadata
33
from typing import List
44

5-
65
@evaluation_test(
76
completion_params=[{"model": "fireworks_ai/accounts/fireworks/models/gpt-oss-120b"}],
87
input_rows=[

0 commit comments

Comments
 (0)