aboutsummaryrefslogtreecommitdiff
path: root/benchmark/agbenchmark_config/reports/20230913T234605_full_run/report.json
blob: 6f291a1e071eab938ef602733769e1fef9cc9d99 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
{
    "command": "agbenchmark start --test=TestWriteFile --mock",
    "benchmark_git_commit_sha": "---",
    "agent_git_commit_sha": "---",
    "completion_time": "2023-09-13T23:46:06+00:00",
    "benchmark_start_time": "2023-09-13T23:46:05+00:00",
    "metrics": {
        "run_time": "0.66 seconds",
        "highest_difficulty": "No successful tests",
        "total_cost": null
    },
    "tests": {
        "TestWriteFile": {
            "data_path": "/Users/merwanehamadi/code/Auto-GPT/benchmark/agbenchmark/challenges/abilities/write_file/data.json",
            "is_regression": false,
            "category": [
                "interface"
            ],
            "task": "Write the word 'Washington' to a .txt file",
            "answer": "The word 'Washington', printed to a .txt file named anything",
            "description": "Tests the agents ability to write to a file",
            "metrics": {
                "difficulty": "interface",
                "success": false,
                "attempted": true,
                "fail_reason": "cannot import name 'copy_artifacts_into_temp_workspace' from 'agbenchmark.agent_interface' (/Users/merwanehamadi/code/Auto-GPT/benchmark/agbenchmark/agent_interface.py)",
                "success_%": 0.0,
                "cost": null,
                "run_time": "0.187 seconds"
            },
            "reached_cutoff": false
        }
    },
    "config": {
        "agent_benchmark_config_path": "/Users/merwanehamadi/code/Auto-GPT/benchmark/agbenchmark_config/config.json",
        "host": "http://localhost:8000"
    }
}