From 1aa8cee743b50d8fbff4e1ddc5260adfe773b9b8 Mon Sep 17 00:00:00 2001 From: James Woffinden-Luey Date: Thu, 9 May 2024 09:04:59 -0700 Subject: [PATCH] fixing test file --- .../samples/sample_math_criteria.json | 50 +++++++++---------- 1 file changed, 25 insertions(+), 25 deletions(-) diff --git a/test/test_files/agenteval-in-out/samples/sample_math_criteria.json b/test/test_files/agenteval-in-out/samples/sample_math_criteria.json index e7ba165465c..c163a502c2f 100644 --- a/test/test_files/agenteval-in-out/samples/sample_math_criteria.json +++ b/test/test_files/agenteval-in-out/samples/sample_math_criteria.json @@ -1,26 +1,26 @@ -{ - "Problem Interpretation": { - "description": "Ability to correctly interpret the problem.", - "accepted_values": ["completely off", "slightly relevant", "relevant", "mostly accurate", "completely accurate"] - }, - "Mathematical Methodology": { - "description": "Adequacy of the chosen mathematical or algorithmic methodology for the question", - "accepted_values": ["inappropriate", "barely adequate", "adequate", "mostly effective", "completely effective"] - }, - "Calculation Correctness": { - "description": "Accuracy of calculations made and solutions given", - "accepted_values": ["completely incorrect", "mostly incorrect", "neither", "mostly correct", "completely correct"] - }, - "Explanation Clarity": { - "description": "Clarity and comprehensibility of explanations, including language use and structure", - "accepted_values": ["not at all clear", "slightly clear", "moderately clear", "very clear", "completely clear"] - }, - "Code Efficiency": { - "description": "Quality of code in terms of efficiency and elegance", - "accepted_values": ["not at all efficient", "slightly efficient", "moderately efficient", "very efficient", "extremely efficient"] - }, - "Code Correctness": { - "description": "Correctness of the provided code", - "accepted_values": ["completely incorrect", "mostly incorrect", "partly correct", "mostly correct", "completely correct"] - } +[ + { "name": "Problem Interpretation", + "description": "Ability to correctly interpret the problem.", + "accepted_values": ["completely off", "slightly relevant", "relevant", "mostly accurate", "completely accurate"] + }, + { "name": "Mathematical Methodology", + "description": "Adequacy of the chosen mathematical or algorithmic methodology for the question", + "accepted_values": ["inappropriate", "barely adequate", "adequate", "mostly effective", "completely effective"] + }, + { "name": "Calculation Correctness", + "description": "Accuracy of calculations made and solutions given", + "accepted_values": ["completely incorrect", "mostly incorrect", "neither", "mostly correct", "completely correct"] + }, + { "name": "Explanation Clarity", + "description": "Clarity and comprehensibility of explanations, including language use and structure", + "accepted_values": ["not at all clear", "slightly clear", "moderately clear", "very clear", "completely clear"] + }, + { "name": "Code Efficiency", + "description": "Quality of code in terms of efficiency and elegance", + "accepted_values": ["not at all efficient", "slightly efficient", "moderately efficient", "very efficient", "extremely efficient"] + }, + { "name": "Code Correctness", + "description": "Correctness of the provided code", + "accepted_values": ["completely incorrect", "mostly incorrect", "partly correct", "mostly correct", "completely correct"] } +]