1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
|
{
"command": "agbenchmark start --test=TestWriteFile --mock",
"benchmark_git_commit_sha": "---",
"agent_git_commit_sha": "---",
"completion_time": "2023-09-13T23:46:06+00:00",
"benchmark_start_time": "2023-09-13T23:46:05+00:00",
"metrics": {
"run_time": "0.66 seconds",
"highest_difficulty": "No successful tests",
"total_cost": null
},
"tests": {
"TestWriteFile": {
"data_path": "/Users/merwanehamadi/code/Auto-GPT/benchmark/agbenchmark/challenges/abilities/write_file/data.json",
"is_regression": false,
"category": [
"interface"
],
"task": "Write the word 'Washington' to a .txt file",
"answer": "The word 'Washington', printed to a .txt file named anything",
"description": "Tests the agents ability to write to a file",
"metrics": {
"difficulty": "interface",
"success": false,
"attempted": true,
"fail_reason": "cannot import name 'copy_artifacts_into_temp_workspace' from 'agbenchmark.agent_interface' (/Users/merwanehamadi/code/Auto-GPT/benchmark/agbenchmark/agent_interface.py)",
"success_%": 0.0,
"cost": null,
"run_time": "0.187 seconds"
},
"reached_cutoff": false
}
},
"config": {
"agent_benchmark_config_path": "/Users/merwanehamadi/code/Auto-GPT/benchmark/agbenchmark_config/config.json",
"host": "http://localhost:8000"
}
}
|