Skip to content

Commit 1505018

Browse files
committed
final
1 parent df26606 commit 1505018

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

tests/test_tau_bench_airline_smoke.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -68,7 +68,7 @@ def tau_bench_airline_smoke_to_evaluation_row(data: List[Dict[str, Any]]) -> Lis
6868
model=["fireworks_ai/accounts/fireworks/models/gpt-oss-120b"],
6969
rollout_input_params=[{"temperature": 0.8, "extra_body": {"reasoning_effort": "medium"}}],
7070
rollout_processor=default_mcp_gym_rollout_processor,
71-
passed_threshold=0.4,
71+
passed_threshold=0.36,
7272
num_runs=1, # Smoke test: single run for quick feedback
7373
mode="pointwise",
7474
max_concurrent_rollouts=50, # Standard concurrency

0 commit comments

Comments
 (0)