We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent adf4745, commit 78e7868 (Copy full SHA for 78e7868)
1 file changed
tests/pytest/test_markdown_highlighting.py
@@ -26,7 +26,7 @@ def markdown_dataset_to_evaluation_row(data: List[Dict[str, Any]]) -> List[Evalu
26
dataset_adapter=markdown_dataset_to_evaluation_row,
27
model=["accounts/fireworks/models/llama-v3p1-8b-instruct"],
28
rollout_input_params=[{"temperature": 0.0, "max_tokens": 4096}],
29
- threshold_of_success=1.0,
+ threshold_of_success=0.5,
30
rollout_processor=default_single_turn_rollout_processor,
31
num_runs=1,
32
mode="pointwise",
0 commit comments