aboutsummaryrefslogtreecommitdiff
path: root/benchmark/agbenchmark_config/reports/20230913T222946_full_run/report.json
blob: 6988f99ca9545a336536341354ec67561350c5dc (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
{
    "command": "agbenchmark start --test=TestWriteFile --mock",
    "benchmark_git_commit_sha": "---",
    "agent_git_commit_sha": "---",
    "completion_time": "2023-09-13T22:33:26+00:00",
    "benchmark_start_time": "2023-09-13T22:29:46+00:00",
    "metrics": {
        "run_time": "219.16 seconds",
        "highest_difficulty": "No successful tests",
        "total_cost": null
    },
    "tests": {
        "TestWriteFile": {
            "data_path": "/Users/merwanehamadi/code/Auto-GPT/benchmark/agbenchmark/challenges/abilities/write_file/data.json",
            "is_regression": false,
            "category": [
                "interface"
            ],
            "task": "Write the word 'Washington' to a .txt file",
            "answer": "The word 'Washington', printed to a .txt file named anything",
            "description": "Tests the agent's ability to write to a file",
            "metrics": {
                "difficulty": "interface",
                "success": false,
                "attempted": true,
                "fail_reason": "assert 1 in []",
                "success_%": 0.0,
                "cost": null,
                "run_time": "218.704 seconds"
            },
            "reached_cutoff": true
        }
    },
    "config": {
        "agent_benchmark_config_path": "/Users/merwanehamadi/code/Auto-GPT/benchmark/agbenchmark_config/config.json",
        "workspace": {
            "input": "auto_gpt_workspace",
            "output": "auto_gpt_workspace"
        },
        "host": "http://localhost:8000"
    }
}