@@ -266,7 +266,6 @@ async def evaluate(
266266 * ,
267267 task_name : str | None = None ,
268268 metadata : dict [str , Any ] | None = None ,
269- tags : Sequence [str ] | None = None ,
270269 ) -> EvaluationReport [InputsT , OutputT , MetadataT ]:
271270 """Evaluates the test cases in the dataset using the given task.
272271
@@ -286,7 +285,6 @@ async def evaluate(
286285 task_name: Optional override to the name of the task being executed, otherwise the name of the task
287286 function will be used.
288287 metadata: Optional dict of experiment metadata.
289- tags: Optional sequence of tags to add to the experiment span.
290288
291289 Returns:
292290 A report containing the results of the evaluation.
@@ -309,7 +307,6 @@ async def evaluate(
309307 dataset_name = self .name ,
310308 n_cases = len (self .cases ),
311309 ** extra_attributes ,
312- _tags = tags ,
313310 ) as eval_span ,
314311 progress_bar or nullcontext (),
315312 ):
@@ -354,8 +351,6 @@ async def _handle_case(case: Case[InputsT, OutputT, MetadataT], report_case_name
354351 full_experiment_metadata : dict [str , Any ] = {'n_cases' : len (self .cases )}
355352 if metadata is not None :
356353 full_experiment_metadata ['metadata' ] = metadata
357- if tags is not None :
358- full_experiment_metadata ['tags' ] = tags
359354 if (averages := report .averages ()) is not None :
360355 full_experiment_metadata ['averages' ] = averages
361356 if averages .assertions is not None :
@@ -374,7 +369,6 @@ def evaluate_sync(
374369 * ,
375370 task_name : str | None = None ,
376371 metadata : dict [str , Any ] | None = None ,
377- tags : Sequence [str ] | None = None ,
378372 ) -> EvaluationReport [InputsT , OutputT , MetadataT ]:
379373 """Evaluates the test cases in the dataset using the given task.
380374
@@ -393,7 +387,6 @@ def evaluate_sync(
393387 task_name: Optional override to the name of the task being executed, otherwise the name of the task
394388 function will be used.
395389 metadata: Optional dict of experiment metadata.
396- tags: Optional sequence of tags to add to the experiment span.
397390
398391 Returns:
399392 A report containing the results of the evaluation.
@@ -408,7 +401,6 @@ def evaluate_sync(
408401 retry_evaluators = retry_evaluators ,
409402 task_name = task_name ,
410403 metadata = metadata ,
411- tags = tags ,
412404 )
413405 )
414406
0 commit comments