aboutsummaryrefslogtreecommitdiff
path: root/frontend/lib/services/benchmark_service.dart
blob: e58ae40c83e458eff419087de1be6e14cf264132 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
import 'dart:async';
import 'package:auto_gpt_flutter_client/models/benchmark/benchmark_step_request_body.dart';
import 'package:auto_gpt_flutter_client/models/benchmark/benchmark_task_request_body.dart';
import 'package:auto_gpt_flutter_client/utils/rest_api_utility.dart';
import 'package:auto_gpt_flutter_client/models/benchmark/api_type.dart';

class BenchmarkService {
  final RestApiUtility api;

  BenchmarkService(this.api);

  /// Creates a new benchmark task.
  ///
  /// [benchmarkTaskRequestBody] is a Map representing the request body for creating a task.
  Future<Map<String, dynamic>> createBenchmarkTask(
      BenchmarkTaskRequestBody benchmarkTaskRequestBody) async {
    try {
      return await api.post('agent/tasks', benchmarkTaskRequestBody.toJson(),
          apiType: ApiType.benchmark);
    } catch (e) {
      throw Exception('Failed to create a new task: $e');
    }
  }

  /// Executes a step in a specific benchmark task.
  ///
  /// [taskId] is the ID of the task.
  /// [benchmarkStepRequestBody] is a Map representing the request body for executing a step.
  Future<Map<String, dynamic>> executeBenchmarkStep(
      String taskId, BenchmarkStepRequestBody benchmarkStepRequestBody) async {
    try {
      return await api.post(
          'agent/tasks/$taskId/steps', benchmarkStepRequestBody.toJson(),
          apiType: ApiType.benchmark);
    } catch (e) {
      throw Exception('Failed to execute step: $e');
    }
  }

  /// Triggers an evaluation for a specific benchmark task.
  ///
  /// [taskId] is the ID of the task.
  Future<Map<String, dynamic>> triggerEvaluation(String taskId) async {
    try {
      return await api.post('agent/tasks/$taskId/evaluations', {},
          apiType: ApiType.benchmark);
    } catch (e) {
      throw Exception('Failed to trigger evaluation: $e');
    }
  }
}