1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
|
{
"command": "agbenchmark start --test=TestWriteFile --mock",
"benchmark_git_commit_sha": "---",
"agent_git_commit_sha": "---",
"completion_time": "2023-09-13T22:33:26+00:00",
"benchmark_start_time": "2023-09-13T22:29:46+00:00",
"metrics": {
"run_time": "219.16 seconds",
"highest_difficulty": "No successful tests",
"total_cost": null
},
"tests": {
"TestWriteFile": {
"data_path": "/Users/merwanehamadi/code/Auto-GPT/benchmark/agbenchmark/challenges/abilities/write_file/data.json",
"is_regression": false,
"category": [
"interface"
],
"task": "Write the word 'Washington' to a .txt file",
"answer": "The word 'Washington', printed to a .txt file named anything",
"description": "Tests the agents ability to write to a file",
"metrics": {
"difficulty": "interface",
"success": false,
"attempted": true,
"fail_reason": "assert 1 in []",
"success_%": 0.0,
"cost": null,
"run_time": "218.704 seconds"
},
"reached_cutoff": true
}
},
"config": {
"agent_benchmark_config_path": "/Users/merwanehamadi/code/Auto-GPT/benchmark/agbenchmark_config/config.json",
"workspace": {
"input": "auto_gpt_workspace",
"output": "auto_gpt_workspace"
},
"host": "http://localhost:8000"
}
}
|