diff options
Diffstat (limited to 'benchmark/agbenchmark/challenges/verticals/data/6_answer_question_combine_csv/data.json')
-rw-r--r-- | benchmark/agbenchmark/challenges/verticals/data/6_answer_question_combine_csv/data.json | 33 |
1 files changed, 33 insertions, 0 deletions
diff --git a/benchmark/agbenchmark/challenges/verticals/data/6_answer_question_combine_csv/data.json b/benchmark/agbenchmark/challenges/verticals/data/6_answer_question_combine_csv/data.json new file mode 100644 index 000000000..9f83f3a22 --- /dev/null +++ b/benchmark/agbenchmark/challenges/verticals/data/6_answer_question_combine_csv/data.json @@ -0,0 +1,33 @@ +{ + "category": [ + "data", + "general" + ], + "cutoff": 120, + "dependencies": [ + "TestAnswerQuestionCsv", + "TestCombineCsv" + ], + "eval_id": "b1bb61cd-3d09-4a69-bb2a-9dbb3c477589", + "ground": { + "answer": "The correct amount spent on utilities.", + "eval": { + "type": "file" + }, + "files": [ + "output.txt" + ], + "should_contain": [ + "1861" + ] + }, + "info": { + "description": "Tests if the agent can answer a question from a csv", + "difficulty": "intermediate", + "side_effects": [ + "" + ] + }, + "name": "AnswerQuestionCombineCsv", + "task": "How much was spent on utilities in total ? Write the answer in an output.txt file." +} |