From 09f6a372921634a13b8dca5cac309b44aa767f9f Mon Sep 17 00:00:00 2001 From: Silen Naihin Date: Fri, 20 Oct 2023 07:21:41 -0700 Subject: fix capitalization, rename --- .../artifacts_out/output.txt | 1 + .../scrape/6_find_autogpt_creator/data.json | 33 +++++++++++++++++++++ .../6_find_cpo_microsoft/artifacts_out/output.txt | 1 - .../scrape/6_find_cpo_microsoft/data.json | 34 ---------------------- 4 files changed, 34 insertions(+), 35 deletions(-) create mode 100644 benchmark/agbenchmark/challenges/verticals/scrape/6_find_autogpt_creator/artifacts_out/output.txt create mode 100644 benchmark/agbenchmark/challenges/verticals/scrape/6_find_autogpt_creator/data.json delete mode 100644 benchmark/agbenchmark/challenges/verticals/scrape/6_find_cpo_microsoft/artifacts_out/output.txt delete mode 100644 benchmark/agbenchmark/challenges/verticals/scrape/6_find_cpo_microsoft/data.json (limited to 'benchmark') diff --git a/benchmark/agbenchmark/challenges/verticals/scrape/6_find_autogpt_creator/artifacts_out/output.txt b/benchmark/agbenchmark/challenges/verticals/scrape/6_find_autogpt_creator/artifacts_out/output.txt new file mode 100644 index 000000000..c37330ccc --- /dev/null +++ b/benchmark/agbenchmark/challenges/verticals/scrape/6_find_autogpt_creator/artifacts_out/output.txt @@ -0,0 +1 @@ +Scotland \ No newline at end of file diff --git a/benchmark/agbenchmark/challenges/verticals/scrape/6_find_autogpt_creator/data.json b/benchmark/agbenchmark/challenges/verticals/scrape/6_find_autogpt_creator/data.json new file mode 100644 index 000000000..c3c069f2e --- /dev/null +++ b/benchmark/agbenchmark/challenges/verticals/scrape/6_find_autogpt_creator/data.json @@ -0,0 +1,33 @@ +{ + "category": [ + "scrape_synthesize", + "general" + ], + "cutoff": 60, + "dependencies": [ + "TestRevenueRetrieval" + ], + "eval_id": "1758058c-f726-484f-96fa-f05e278e5ff5", + "ground": { + "answer": "Toran is from Scotland https://uk.linkedin.com/in/toran-richards.", + "eval": { + "type": "file" + }, + 
"files": [ + "output.txt" + ], + "should_contain": [ + "cotland" + ], + "should_not_contain": [] + }, + "info": { + "description": "Tests if the agent can do multi step retrieval (1. who is the CEO of AutoGPT 2. find where Toran is from)", + "difficulty": "intermediate", + "side_effects": [ + "" + ] + }, + "name": "TestAutoGPTCountry", + "task": "Write the country the inventor/creator of AutoGPT is from to a file called output.txt" +} diff --git a/benchmark/agbenchmark/challenges/verticals/scrape/6_find_cpo_microsoft/artifacts_out/output.txt b/benchmark/agbenchmark/challenges/verticals/scrape/6_find_cpo_microsoft/artifacts_out/output.txt deleted file mode 100644 index c37330ccc..000000000 --- a/benchmark/agbenchmark/challenges/verticals/scrape/6_find_cpo_microsoft/artifacts_out/output.txt +++ /dev/null @@ -1 +0,0 @@ -Scotland \ No newline at end of file diff --git a/benchmark/agbenchmark/challenges/verticals/scrape/6_find_cpo_microsoft/data.json b/benchmark/agbenchmark/challenges/verticals/scrape/6_find_cpo_microsoft/data.json deleted file mode 100644 index 112df0cb8..000000000 --- a/benchmark/agbenchmark/challenges/verticals/scrape/6_find_cpo_microsoft/data.json +++ /dev/null @@ -1,34 +0,0 @@ -{ - "category": [ - "scrape_synthesize", - "general" - ], - "cutoff": 60, - "dependencies": [ - "TestRevenueRetrieval" - ], - "eval_id": "1758058c-f726-484f-96fa-f05e278e5ff5", - "ground": { - "answer": "Toran is from Scotland https://uk.linkedin.com/in/toran-richards.", - "eval": { - "type": "file" - }, - "files": [ - "output.txt" - ], - "should_contain": [ - "Scotland", - "scotland" - ], - "should_not_contain": [] - }, - "info": { - "description": "Tests if the agent can do multi step retrieval (1. who is the CEO of AutoGPT 2. find Toran is from)", - "difficulty": "intermediate", - "side_effects": [ - "" - ] - }, - "name": "TestAutoGPTCountry", - "task": "Write the country the the inventor/creator of AutoGPT is from to a file called output.txt" -} -- cgit v1.2.3