feat: UTC-563: Annotations per task coverage percentage distributed randomly (#9374)

mcanu · web-flow · commit 6b1eb7aa0163 · 2026-02-12T20:33:20.000+04:00
Co-authored-by: mcanu <mcanu@users.noreply.github.com>
diff --git a/label_studio/projects/models.py b/label_studio/projects/models.py
@@ -6,6 +6,7 @@
 
 from annoying.fields import AutoOneToOneField
 from core.current_request import CurrentContext
+from core.feature_flags import flag_set
 from core.label_config import (
     check_control_in_config_by_regex,
     check_toname_in_config_by_regex,
@@ -576,17 +577,24 @@ def _rearrange_overlap_cohort(self):
                 all_project_tasks.filter(id__in=ids), overlap=max_annotations, is_labeled=True
             )
             # order other tasks by count(annotations)
-            tasks_with_min_annotations = (
-                tasks_with_min_annotations.annotate(anno=Count('annotations')).order_by('-anno').distinct()
-            )
+            tasks_with_min_annotations = tasks_with_min_annotations.annotate(annotation_count=Count('annotations'))
+            if flag_set('fflag_feat_utc_563_randomize_overlap_cohort', user='auto'):
+                # Randomize within tie groups so cohort selection isn't deterministic.
+                # If there are many tasks with the same annotation count, their order is random.
+                tasks_with_min_annotations = tasks_with_min_annotations.order_by('-annotation_count', '?')
+            else:
+                tasks_with_min_annotations = tasks_with_min_annotations.order_by('-annotation_count').distinct()
+
+            # Materialize the full ID list once to ensure consistent ordering across slices, instead of slicing twice with random ordering.
+            all_min_ids = list(tasks_with_min_annotations.values_list('id', flat=True))
+            cohort_ids = all_min_ids[:left_must_tasks]
+            remaining_ids = all_min_ids[left_must_tasks:]
+
             # assign overlap depending on annotation count
             # assign max_annotations and update is_labeled
-            ids = list(tasks_with_min_annotations[:left_must_tasks].values_list('id', flat=True))
-            self._batch_update_with_retry(all_project_tasks.filter(id__in=ids), overlap=max_annotations)
+            self._batch_update_with_retry(all_project_tasks.filter(id__in=cohort_ids), overlap=max_annotations)
             # assign 1 to left
-            ids = list(tasks_with_min_annotations[left_must_tasks:].values_list('id', flat=True))
-            min_tasks_to_update = all_project_tasks.filter(id__in=ids)
-            self._batch_update_with_retry(min_tasks_to_update, overlap=1)
+            self._batch_update_with_retry(all_project_tasks.filter(id__in=remaining_ids), overlap=1)
         else:
             ids = list(tasks_with_max_annotations.values_list('id', flat=True))
             self._batch_update_with_retry(all_project_tasks.filter(id__in=ids), overlap=max_annotations)
diff --git a/label_studio/projects/tests/test_models.py b/label_studio/projects/tests/test_models.py
@@ -0,0 +1,102 @@
+"""Tests for projects.models (Project model and related logic)."""
+from django.test import TestCase
+from projects.tests.factories import ProjectFactory
+from tasks.models import Task
+from tasks.tests.factories import AnnotationFactory, TaskFactory
+from tests.utils import mock_feature_flag
+
+
+class TestRearrangeOverlapCohort(TestCase):
+    """
+    Tests for Project._rearrange_overlap_cohort().
+
+    Covers overlap cohort assignment when overlap_cohort_percentage < 100:
+    correct cohort size, deterministic vs random tie-breaking (feature flag),
+    and prioritization of tasks with more annotations (progress preservation).
+    """
+
+    @mock_feature_flag('fflag_feat_utc_563_randomize_overlap_cohort', True, parent_module='projects.models')
+    def test_randomize_when_flag_on(self):
+        """
+        With fflag_feat_utc_563_randomize_overlap_cohort on, cohort selection
+        varies across runs because tie-breaking within same annotation count
+        is random. Expected: at least 2 distinct cohort ID sets over 10 runs,
+        and cohort size always equals must_tasks.
+        """
+        num_tasks = 20
+        overlap_cohort_pct = 25
+        expected_cohort_size = int(num_tasks * overlap_cohort_pct / 100 + 0.5)  # 5
+        project = ProjectFactory(
+            maximum_annotations=2,
+            overlap_cohort_percentage=overlap_cohort_pct,
+        )
+        TaskFactory.create_batch(num_tasks, project=project)
+
+        cohorts_seen = set()  # distinct cohorts (frozensets of task IDs) observed across runs
+        for _ in range(10):  # repeat the assignment, recording the cohort each time
+            project._rearrange_overlap_cohort()
+            cohort_ids = frozenset(Task.objects.filter(project=project, overlap__gt=1).values_list('id', flat=True))
+            assert len(cohort_ids) == expected_cohort_size  # size must hold on every run
+            cohorts_seen.add(cohort_ids)
+        assert len(cohorts_seen) >= 2, 'Random tie-breaking should produce at least 2 different cohorts over 10 runs'
+
+    @mock_feature_flag('fflag_feat_utc_563_randomize_overlap_cohort', False, parent_module='projects.models')
+    def test_deterministic_when_flag_off(self):
+        """
+        With fflag_feat_utc_563_randomize_overlap_cohort off, cohort selection
+        is deterministic. Expected: two consecutive runs yield the same cohort
+        ID set and correct cohort size.
+        """
+        num_tasks = 20
+        overlap_cohort_pct = 25
+        expected_cohort_size = int(num_tasks * overlap_cohort_pct / 100 + 0.5)  # 5
+        project = ProjectFactory(
+            maximum_annotations=2,
+            overlap_cohort_percentage=overlap_cohort_pct,
+        )
+        TaskFactory.create_batch(num_tasks, project=project)
+
+        project._rearrange_overlap_cohort()
+        cohort_first = frozenset(Task.objects.filter(project=project, overlap__gt=1).values_list('id', flat=True))
+        project._rearrange_overlap_cohort()
+        cohort_second = frozenset(Task.objects.filter(project=project, overlap__gt=1).values_list('id', flat=True))
+        assert len(cohort_first) == expected_cohort_size
+        assert cohort_first == cohort_second  # both runs selected the same tasks
+
+    @mock_feature_flag('fflag_feat_utc_563_randomize_overlap_cohort', True, parent_module='projects.models')
+    def test_preserves_progress_when_flag_on(self):
+        """
+        Tasks with more finished annotations are prioritized into the cohort
+        (progress preserved). With flag on, only tie-breaking is random.
+        Expected: tasks that already have one annotation are in the cohort.
+        """
+        num_tasks = 10
+        overlap_cohort_pct = 30
+        expected_cohort_size = int(num_tasks * overlap_cohort_pct / 100 + 0.5)  # 3
+        project = ProjectFactory(
+            maximum_annotations=2,
+            overlap_cohort_percentage=overlap_cohort_pct,
+        )
+        tasks = TaskFactory.create_batch(num_tasks, project=project)
+        for t in tasks[:2]:  # annotate only the first two tasks
+            AnnotationFactory(
+                task=t,
+                project=project,
+                result=[
+                    {
+                        'value': {'choices': ['A']},
+                        'from_name': 'text_class',
+                        'to_name': 'text',
+                        'type': 'choices',
+                    }
+                ],
+                was_cancelled=False,
+                ground_truth=False,
+            )
+
+        project._rearrange_overlap_cohort()
+
+        cohort_ids = set(Task.objects.filter(project=project, overlap__gt=1).values_list('id', flat=True))
+        assert len(cohort_ids) == expected_cohort_size
+        assert tasks[0].id in cohort_ids  # annotated task kept in the cohort
+        assert tasks[1].id in cohort_ids  # annotated task kept in the cohort