mapswipe
diff --git a/apps/project/exports/mapping_results_aggregate/tests/__init__.py b/apps/project/exports/mapping_results_aggregate/tests/__init__.py
diff --git a/apps/project/exports/mapping_results_aggregate/tests/task_test.py b/apps/project/exports/mapping_results_aggregate/tests/task_test.py
Lines changed: 168 additions & 0 deletions
diff --git a/assets b/assets
diff --git a/project_types/street/api_calls.py b/project_types/street/api_calls.py
Lines changed: 23 additions & 6 deletions
diff --git a/project_types/street/tests/__init__.py b/project_types/street/tests/__init__.py
@@ -0,0 +1,185 @@
+import math
+
+import pandas as pd
+
+from apps.project.exports.mapping_results_aggregate.task import (
+    _add_missing_result_columns,  # type: ignore[reportPrivateUsage]
+    _calc_agreement,  # type: ignore[reportPrivateUsage]
+    _calc_count,  # type: ignore[reportPrivateUsage]
+    _calc_parent_option_count,  # type: ignore[reportPrivateUsage]
+    _calc_share,  # type: ignore[reportPrivateUsage]
+    _get_custom_options,  # type: ignore[reportPrivateUsage]
+)
+from main.tests import TestCase
+
+
+class TestProjectStats(TestCase):
+    """Unit tests for the private helpers of the mapping-results aggregate export."""
+
+    def test_calc_agreement(self):
+        """Agreement for one task row with a total and four per-option counts."""
+        ds = pd.Series(
+            data=[40, 15, 5, 17, 3],
+            index=["total_count", "1_count", "2_count", "3_count", "4_count"],
+        )
+        agg2 = _calc_agreement(ds)
+        # The expected value matches sum(n * (n - 1)) / (N * (N - 1)) = 508 / 1560.
+        # Compare with a tolerance: the last digits of a float depend on the
+        # order of the arithmetic inside the helper.
+        assert math.isclose(agg2, 0.32564102564102565, rel_tol=1e-9)
+
+    def test_calc_count(self):
+        """The count for the first row is the sum of its option count columns."""
+        df = pd.DataFrame(
+            data=[[1, 15, 5, 20], [1, 234, 45, 6]],
+            columns=["taskId", "1_count", "2_count", "3_count"],
+        )
+        result = _calc_count(df)
+        # 15 + 5 + 20; taskId must not be counted.
+        assert result[0] == 40
+
+    def test_calc_share(self):
+        """The share columns of the first row hold option count / total_count."""
+        df = pd.DataFrame(
+            data=[[1, 40, 15, 5, 20], [1, 285, 234, 45, 6]],
+            columns=["taskId", "total_count", "1_count", "2_count", "3_count"],
+        )
+        share = _calc_share(df)
+        # 15/40, 5/40 and 20/40 are exactly representable, so == is safe here.
+        assert share.filter(like="share").iloc[0].tolist() == [0.375, 0.125, 0.5]
+
+    def test_get_custom_options(self):
+        """Raw option dicts are parsed into a mapping of value -> set of sub-option values."""
+        for raw_custom_options, expected_values in [
+            (
+                [{"value": 0}, {"value": 1}, {"value": 2}, {"value": 3}],
+                {0: set(), 1: set(), 2: set(), 3: set()},
+            ),
+            (
+                [
+                    {
+                        "value": 0,
+                        "subOptions": [{"value": 4}, {"value": 5}],
+                    },
+                    {"value": 1},
+                    {"value": 2},
+                    {"value": 3},
+                ],
+                {0: {4, 5}, 1: set(), 2: set(), 3: set()},
+            ),
+            (
+                [
+                    {
+                        "value": 0,
+                        "subOptions": [{"value": 4}, {"value": 5}],
+                    },
+                    {"value": 1},
+                    {"value": 2},
+                    {
+                        "value": 3,
+                        "subOptions": [{"value": 10}, {"value": 12}],
+                    },
+                ],
+                {0: {4, 5}, 1: set(), 2: set(), 3: {10, 12}},
+            ),
+        ]:
+            parsed_custom_options = _get_custom_options(raw_custom_options)
+            # Name the failing case; the loop otherwise hides which input broke.
+            assert parsed_custom_options == expected_values, f"input: {raw_custom_options!r}"
+
+    def test_add_missing_result_columns(self):
+        """Missing option columns are added zero-filled; the input frame is unchanged."""
+        df = pd.DataFrame(
+            data=[
+                ["project-1-group-1-task-1", 1],
+                ["project-1-group-1-task-1", 5],
+                ["project-1-group-2-task-1", 1],
+                ["project-1-group-2-task-1", 1],
+                ["project-1-group-2-task-1", 1],
+                ["project-2-group-3-task-1", 2],
+                ["project-2-group-1-task-1", 3],
+            ],
+            columns=[
+                "task_id",
+                "result",
+            ],
+        )
+        # One row per task, one column per result value seen, cells = occurrence count.
+        df = df.groupby(["task_id", "result"]).size().unstack(fill_value=0)
+        updated_df = _add_missing_result_columns(
+            df,
+            {
+                1: {4, 5},
+                2: {6},
+                3: set(),
+            },
+        )
+        # Columns of the input frame (must be left as they were)
+        assert list(df.columns) == [1, 2, 3, 5]
+        # Columns of the returned frame (4 and 6 added)
+        assert list(updated_df.columns) == [1, 2, 3, 4, 5, 6]
+        # Data of the input frame
+        assert df.to_csv() == (
+            "task_id,1,2,3,5\n"
+            "project-1-group-1-task-1,1,0,0,1\n"
+            "project-1-group-2-task-1,3,0,0,0\n"
+            "project-2-group-1-task-1,0,0,1,0\n"
+            "project-2-group-3-task-1,0,1,0,0\n"
+        )
+        # Data of the returned frame (added columns are all zero)
+        assert updated_df.to_csv() == (
+            "task_id,1,2,3,4,5,6\n"
+            "project-1-group-1-task-1,1,0,0,0,1,0\n"
+            "project-1-group-2-task-1,3,0,0,0,0,0\n"
+            "project-2-group-1-task-1,0,0,1,0,0,0\n"
+            "project-2-group-3-task-1,0,1,0,0,0,0\n"
+        )
+
+    def test_calc_parent_option_count(self):
+        """A parent option's count becomes its own count plus its children's counts."""
+        df = pd.DataFrame(
+            data=[
+                [1, 40, 1, 0, 20, 0, 1, 0],
+                [2, 41, 0, 5, 20, 0, 0, 0],
+                [3, 42, 10, 10, 20, 0, 0, 1],
+                [4, 281, 0, 1, 0, 1, 1, 4],
+                [5, 282, 15, 10, 0, 1, 2, 4],
+                [1, 283, 2, 20, 0, 1, 0, 0],
+            ],
+            columns=[
+                "taskId",
+                "total_count",
+                "1_count",
+                "2_count",
+                "3_count",
+                "4_count",  # Child of 1
+                "5_count",  # Child of 1
+                "6_count",  # Child of 2
+            ],
+        )
+        updated_df = _calc_parent_option_count(
+            df,
+            {
+                1: {4, 5},
+                2: {6},
+                3: set(),
+            },
+        )
+        # Columns that are not a parent of another option shouldn't change
+        for column in [
+            "taskId",
+            "total_count",
+            "3_count",
+            "4_count",
+            "5_count",
+            "6_count",
+        ]:
+            assert df[column].compare(updated_df[column]).size == 0
+        # Parent columns change only in rows where a child has a non-zero count
+        for column, updated_index, updated_value in [
+            ("1_count", [0, 3, 4, 5], [2, 2, 18, 3]),
+            ("2_count", [2, 3, 4], [11, 5, 14]),
+        ]:
+            compared = df[column].compare(updated_df[column])
+            assert list(compared["other"].index) == updated_index
+            assert list(compared["other"]) == updated_value
@@ -8,6 +8,7 @@
 import mercantile  # type: ignore[reportMissingTypeStubs]
 import pandas as pd
 import requests
+from geojson_pydantic import Feature as PydanticFeature
 from geojson_pydantic import FeatureCollection as PydanticFeatureCollection
 from geojson_pydantic.geometries import MultiPolygon as PydanticMultiPolygon
 from geojson_pydantic.geometries import Polygon as PydanticPolygon
@@ -73,17 +74,48 @@ def create_tiles(
 
 # FIXME: move this to utils
 def geojson_to_polygon(geojson_data: dict[str, Any]):
+    """Merge the polygons of a GeoJSON Feature or FeatureCollection into one geometry.
+
+    Args:
+        geojson_data: Parsed GeoJSON, either a single Feature or a FeatureCollection.
+
+    Returns:
+        The ``unary_union`` of the shapely shapes built from every feature geometry.
+
+    Raises:
+        ValidationException: If the data is neither a valid Feature nor a valid
+            FeatureCollection, if any feature geometry is not a Polygon or
+            MultiPolygon, or if there are no features to combine.
+    """
+    # A bare Feature is accepted by wrapping it in a single-item collection.
+    fc: PydanticFeatureCollection[Any] | None
+    try:
+        feature = PydanticFeature(**geojson_data)
+        fc = PydanticFeatureCollection(
+            type="FeatureCollection",
+            features=[feature],
+        )
+    except ValidationError:
+        fc = None
+
     # NOTE: We might not need this, as we already check this
     try:
-        fc = PydanticFeatureCollection(**geojson_data)
+        if fc is None:
+            fc = PydanticFeatureCollection(**geojson_data)
     except ValidationError as e:
         raise ValidationException("Invalid GeoJSON FeatureCollection") from e
 
     polygon_types = (PydanticPolygon, PydanticMultiPolygon)
-    geometries = [shape(feature.geometry) for feature in fc.features if isinstance(feature.geometry, polygon_types)]
 
-    if not geometries:
-        raise ValidationException("No valid Polygon or MultiPolygon found in the GeoJSON FeatureCollection")
+    has_invalid_geometries = any(not isinstance(feature.geometry, polygon_types) for feature in fc.features)
+    if has_invalid_geometries:
+        raise ValidationException("Non-polygon geometries cannot be combined into a MultiPolygon.")
+
+    geometries = [shape(feature.geometry) for feature in fc.features]
+
+    # An empty collection passes the check above, so reject it explicitly.
+    if not geometries:
+        raise ValidationException("No valid Polygon or MultiPolygon found in the GeoJSON FeatureCollection")
 
     return unary_union(geometries)
 
@@ -140,7 +157,7 @@ def parallelized_processing(
 
 def download_and_process_tile(
     *,
-    row: dict[Hashable, Any],
+    row: dict[Hashable, Any] | pd.Series,
     polygon: ShapelyBaseGeometry,
     kwargs: dict[str, Any],
     attempt_limit: int = 3,
@@ -219,7 +236,7 @@ def filter_results(
     results_df: pd.DataFrame,
     creator_id: int | None = None,
     is_pano: bool | None = None,
-    organization_id: str | None = None,
+    organization_id: int | None = None,
     start_time: str | None = None,
     end_time: str | None = None,
 ):