@@ -35,6 +35,44 @@ class RunSummary(BaseModel):
35
35
total_tasks : int = Field (..., description = "Total number of executed tasks." )
36
36
37
37
38
class ModelSummary(BaseModel):
    """Summary statistics for a single LLM, aggregated over all repeats.

    Every field is required: each one is declared with ``...`` as its
    default, so no value is filled in automatically.
    """

    # Identifies which model the remaining statistics belong to.
    model_name: str = Field(
        ...,
        description="Name of the LLM.",
    )

    # NOTE(review): described as a percentage; whether the scale is 0-1 or
    # 0-100 is not visible from this model -- confirm against the producer.
    avg_success_rate: float = Field(
        ...,
        description="Percentage of successfully completed tasks across all repeats.",
    )
    avg_total_tasks: float = Field(
        ...,
        description="Average number of tasks executed through all repeats.",
    )
    # NOTE(review): the time unit is not stated here -- confirm with the caller.
    avg_time: float = Field(
        ...,
        description="Average time taken across all tasks and repeats.",
    )

    repeats: int = Field(
        ...,
        description="Total number of repeats for the model for each task.",
    )
54
+
55
+
56
class TasksSummary(BaseModel):
    """Summary statistics for one task, aggregated over all of its repeats.

    Success rate and time are each reported as a mean / standard-deviation
    pair. Every field is required (declared with ``...`` as its default).
    """

    # Identifies which model produced the results summarized below.
    model_name: str = Field(
        ...,
        description="Name of the LLM.",
    )

    # --- success rate: mean and spread over the repeats ---
    avg_success_rate: float = Field(
        ...,
        description="Average result for task across all repeats.",
    )
    std_success_rate: float = Field(
        ...,
        description="Standard deviation of the success rate across all repeats.",
    )

    # --- time: mean and spread over the repeats ---
    # NOTE(review): the time unit is not stated here -- confirm with the caller.
    avg_time: float = Field(
        ...,
        description="Average time taken across all repeats for one task.",
    )
    std_time: float = Field(
        ...,
        description="Standard deviation of the time taken across all repeats for one task.",
    )

    total_tasks: int = Field(
        ...,
        description="Total number of executed tasks across all repeats per task.",
    )
74
+
75
+
38
76
class TimeoutException(Exception):
    """Marker exception for timeouts; adds nothing on top of ``Exception``."""
40
78
0 commit comments