diff --git a/scripts/evals/eval.py b/scripts/evals/eval.py index 236c80c4c..d5c6516ac 100644 --- a/scripts/evals/eval.py +++ b/scripts/evals/eval.py @@ -247,7 +247,7 @@ async def run_eval_pipeline( properties={ "result": { "type": "boolean", - "description": "The result of the eval", + "description": "Whether the answer is correct or not", }, "reasoning": { "type": "string",