aboutsummaryrefslogtreecommitdiff
path: root/benchmark/agbenchmark/challenges/verticals/scrape/4_revenue_retrieval_2/data.json
blob: 8ca61b9e74b98e56091a69b8efe4e27e98022853 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
{
    "category": [
        "scrape_synthesize"
    ],
    "cutoff": 60,
    "dependencies": [
        "TestRevenueRetrieval"
    ],
    "eval_id": "552bdf23-db40-4bd1-b123-4ed820886cc1",
    "ground": {
        "answer": "15 Millions\n112 Millions\n117 Millions\n204 Millions\n413 Millions\n2,014 Millions\n3,198 Millions\n4,046 Millions\n7,000 Millions\n11,759 Millions\n21,461 Millions\n24,578 Millions\n31,536 Millions\n53,823 Millions\n81,462 Millions",
        "eval": {
            "type": "file"
        },
        "files": [
            ".txt"
        ],
        "should_contain": [
          "15",
          "112",
          "117",
          "204",
          "413",
          "2,0",
          "3,198",
          "4,046",
          "7,000",
          "11,759",
          "21,461",
          "24,578",
          "31,536",
          "53,823",
          "81,462"
        ],
        "should_not_contain": []
    },
    "info": {
        "description": "Tests if the agent can retrieve all the revenues of Tesla since its creation.",
        "difficulty": "intermediate",
        "side_effects": [
            "tests if there is in fact an LLM attached"
        ]
    },
    "name": "RevenueRetrieval2",
    "task": "Write tesla's revenue every year since its creation into a .txt file. Use the US notation, with a precision rounded to the nearest million dollars (for instance, $31,578 million)."
}